Repository: GrammaTech/gtirb Branch: master Commit: eb6a7af1bb97 Files: 357 Total size: 2.2 MB Directory structure: gitextract_07t2irr6/ ├── .ci/ │ ├── Dockerfile.static │ ├── Dockerfile.ubuntu20 │ ├── Dockerfile.ubuntu22 │ ├── Dockerfile.ubuntu24 │ ├── PKGBUILD │ ├── adjust-coverage-paths.py │ ├── build.py │ ├── gitlab-ci.yml │ ├── pre-commit │ ├── test-install-all.sh │ ├── test-install-static.sh │ ├── test-install.cpp │ ├── test-install.lisp │ ├── test-install.py │ └── test-interop.sh ├── .clang-format ├── .clang-tidy ├── .cmake-format.yaml ├── .dockerignore ├── .flake8 ├── .github/ │ └── workflows/ │ └── actions.yml ├── .gitignore ├── .gtirb.tex ├── .isort.cfg ├── .lisp-format ├── .pre-commit-config.yaml ├── AlignOf.cmake ├── AuxData.md ├── CHANGELOG.md ├── CMakeLists.googletest ├── CMakeLists.txt ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── FAQ.md ├── LICENSE.txt ├── Macros.cmake ├── PROTOBUF.md ├── README.md ├── cl/ │ ├── CMakeLists.txt │ ├── README.md │ ├── dot.lisp │ ├── gtirb.asd │ ├── gtirb.lisp │ ├── package.lisp │ ├── ranged.lisp │ ├── test.lisp │ ├── update.lisp │ ├── utility.lisp │ ├── validate.lisp │ └── version.lisp ├── conanfile.py ├── cpack-config.cmake ├── doc/ │ ├── CFG-Edges.md │ ├── CMakeLists.txt │ ├── binary-representation.md │ ├── cl/ │ │ ├── CMakeLists.txt │ │ └── write-documentation.lisp │ ├── cpp/ │ │ ├── CMakeLists.txt │ │ ├── Doxyfile.in │ │ ├── DoxygenLayout.xml │ │ └── README.md │ ├── dot/ │ │ └── gtirb.dot │ ├── examples/ │ │ ├── CMakeLists.txt │ │ ├── api-walkthrough.cpp │ │ ├── cfg-paths.cpp │ │ ├── cfg-paths.lisp │ │ ├── cfg-paths.py │ │ ├── cfgpaths.java │ │ ├── data-symbols.cpp │ │ ├── data-symbols.lisp │ │ ├── data-symbols.py │ │ ├── datasymbols.java │ │ ├── functions.cpp │ │ ├── jumps.cpp │ │ ├── show-cfg.lisp │ │ ├── show-cfg.py │ │ └── stack-stamp.md │ ├── general/ │ │ ├── AuxDataContainer.md │ │ ├── Block.md │ │ ├── ByteBlock.md │ │ ├── ByteInterval.md │ │ ├── CFG.md │ │ ├── CMakeLists.txt │ │ ├── COMPONENTS.md │ │ ├── 
CfgEdge.md │ │ ├── CfgEdgeLabel.md │ │ ├── CfgNode.md │ │ ├── CodeBlock.md │ │ ├── DataBlock.md │ │ ├── Doxyfile.in │ │ ├── DoxygenLayout.xml │ │ ├── IR.md │ │ ├── Module.md │ │ ├── Node.md │ │ ├── ProxyBlock.md │ │ ├── Section.md │ │ ├── SymAddrAddr.md │ │ ├── SymAddrConst.md │ │ ├── Symbol.md │ │ ├── SymbolicExpression.md │ │ ├── Version.md │ │ ├── examples.dox │ │ └── images.dox │ ├── java/ │ │ └── CMakeLists.txt │ ├── preprocmd.py │ └── python/ │ ├── CMakeLists.txt │ └── conf.py ├── gtirbConfig.cmake.in ├── include/ │ └── gtirb/ │ ├── Addr.hpp │ ├── Allocator.hpp │ ├── AuxData.hpp │ ├── AuxDataContainer.hpp │ ├── AuxDataSchema.hpp │ ├── ByteInterval.hpp │ ├── CFG.hpp │ ├── Casting.hpp │ ├── CfgNode.hpp │ ├── CodeBlock.hpp │ ├── Context.hpp │ ├── DataBlock.hpp │ ├── DecodeMode.hpp │ ├── ErrorOr.hpp │ ├── Export.hpp │ ├── IR.hpp │ ├── Module.hpp │ ├── Node.hpp │ ├── Observer.hpp │ ├── Offset.hpp │ ├── ProxyBlock.hpp │ ├── Section.hpp │ ├── Symbol.hpp │ ├── SymbolicExpression.hpp │ ├── Utility.hpp │ ├── gtirb.hpp │ └── version.h.in ├── java/ │ ├── .gitignore │ ├── CMakeLists.txt │ ├── Version.java.in │ ├── build.gradle │ ├── com/ │ │ └── grammatech/ │ │ └── gtirb/ │ │ ├── AuxDataContainer.java │ │ ├── AuxDataSchema.java │ │ ├── AuxDataSchemas.java │ │ ├── ByteBlock.java │ │ ├── ByteInterval.java │ │ ├── CFG.java │ │ ├── CfiDirective.java │ │ ├── CodeBlock.java │ │ ├── DataBlock.java │ │ ├── Edge.java │ │ ├── ElfSymbolInfoTuple.java │ │ ├── ElfSymbolVersionsTable.java │ │ ├── IR.java │ │ ├── Module.java │ │ ├── Node.java │ │ ├── Offset.java │ │ ├── PeExportEntry.java │ │ ├── PeImportEntry.java │ │ ├── PeResourceEntry.java │ │ ├── ProbFuncName.java │ │ ├── ProxyBlock.java │ │ ├── Section.java │ │ ├── SectionPropertyTuple.java │ │ ├── SymAddrAddr.java │ │ ├── SymAddrConst.java │ │ ├── Symbol.java │ │ ├── SymbolicExpression.java │ │ ├── TreeListItem.java │ │ ├── TreeListUtils.java │ │ ├── TypeTableEntry.java │ │ ├── Util.java │ │ ├── auxdatacodec/ │ │ │ ├── 
BoolCodec.java │ │ │ ├── ByteCodec.java │ │ │ ├── Codec.java │ │ │ ├── FloatCodec.java │ │ │ ├── IntegerCodec.java │ │ │ ├── ListCodec.java │ │ │ ├── LongCodec.java │ │ │ ├── MapCodec.java │ │ │ ├── OffsetCodec.java │ │ │ ├── SetCodec.java │ │ │ ├── ShortCodec.java │ │ │ ├── StringCodec.java │ │ │ ├── Tuple1Codec.java │ │ │ ├── Tuple2Codec.java │ │ │ ├── Tuple3Codec.java │ │ │ ├── Tuple4Codec.java │ │ │ ├── Tuple5Codec.java │ │ │ ├── UuidCodec.java │ │ │ ├── Variant11Codec.java │ │ │ ├── Variant2Codec.java │ │ │ └── Variant3Codec.java │ │ ├── tuple/ │ │ │ ├── Tuple1.java │ │ │ ├── Tuple2.java │ │ │ ├── Tuple3.java │ │ │ ├── Tuple4.java │ │ │ └── Tuple5.java │ │ └── variant/ │ │ ├── Token.java │ │ ├── Variant11.java │ │ ├── Variant2.java │ │ └── Variant3.java │ ├── pom.xml.in │ ├── settings.gradle │ └── tests/ │ ├── TestAuxData.java │ ├── TestByteIntervals.java │ ├── TestIrSanity.java │ ├── TestModules.java │ ├── TestSections.java │ ├── TestSymbolicExpressions.java │ ├── TestSymbols.java │ ├── TestTuple.java │ └── TestVariant.java ├── proto/ │ ├── AuxData.proto │ ├── ByteInterval.proto │ ├── CFG.proto │ ├── CMakeLists.txt │ ├── CodeBlock.proto │ ├── DataBlock.proto │ ├── IR.proto │ ├── Module.proto │ ├── Offset.proto │ ├── ProxyBlock.proto │ ├── Section.proto │ ├── Symbol.proto │ ├── SymbolicExpression.proto │ └── v0/ │ ├── AuxData.proto │ ├── AuxDataContainer.proto │ ├── Block.proto │ ├── ByteMap.proto │ ├── CFG.proto │ ├── CMakeLists.txt │ ├── DataObject.proto │ ├── IR.proto │ ├── ImageByteMap.proto │ ├── Module.proto │ ├── Offset.proto │ ├── ProxyBlock.proto │ ├── Section.proto │ ├── Symbol.proto │ └── SymbolicExpression.proto ├── python/ │ ├── CMakeLists.txt │ ├── README.md │ ├── gtirb/ │ │ ├── __init__.py │ │ ├── auxdata.py │ │ ├── block.py │ │ ├── byteinterval.py │ │ ├── cfg.py │ │ ├── ir.py │ │ ├── lazyintervaltree.py │ │ ├── module.py │ │ ├── node.py │ │ ├── offset.py │ │ ├── proto/ │ │ │ └── __init__.py │ │ ├── section.py │ │ ├── serialization.py │ │ ├── 
symbol.py │ │ ├── symbolicexpression.py │ │ └── util.py │ ├── mypy.ini.in │ ├── pyproject.toml.in │ ├── requirements-dev.txt │ ├── requirements-mypy.txt │ ├── stubs/ │ │ ├── README.md │ │ ├── intervaltree/ │ │ │ ├── __init__.pyi │ │ │ ├── interval.pyi │ │ │ └── intervaltree.pyi │ │ ├── networkx/ │ │ │ ├── __init__.pyi │ │ │ └── classes/ │ │ │ ├── __init__.pyi │ │ │ └── multidigraph.pyi │ │ └── sortedcontainers/ │ │ ├── __init__.pyi │ │ └── sorteddict.pyi │ ├── tests/ │ │ ├── hello.gtirb │ │ ├── helpers.py │ │ ├── test_auxdata.py │ │ ├── test_block.py │ │ ├── test_blocks_at.py │ │ ├── test_blocks_at_offset.py │ │ ├── test_blocks_on.py │ │ ├── test_blocks_on_offset.py │ │ ├── test_byte_intervals_at.py │ │ ├── test_byte_intervals_on.py │ │ ├── test_cfg.py │ │ ├── test_deep_eq.py │ │ ├── test_ir.py │ │ ├── test_module.py │ │ ├── test_node_from_uuid.py │ │ ├── test_properties.py │ │ ├── test_repr.py │ │ ├── test_section.py │ │ ├── test_serialization.py │ │ ├── test_symbolic_expression.py │ │ ├── test_symbolic_expressions_at.py │ │ └── test_wrapper.py │ ├── tox.ini │ └── version.py.in ├── resources/ │ └── windows_version_resource.rc.in ├── src/ │ ├── AuxData.cpp │ ├── AuxDataContainer.cpp │ ├── ByteInterval.cpp │ ├── CFG.cpp │ ├── CFGSerialization.hpp │ ├── CMakeLists.txt │ ├── CodeBlock.cpp │ ├── Context.cpp │ ├── DataBlock.cpp │ ├── ErrorOr.cpp │ ├── IR.cpp │ ├── Module.cpp │ ├── Node.cpp │ ├── Offset.cpp │ ├── ProxyBlock.cpp │ ├── Section.cpp │ ├── Serialization.cpp │ ├── Serialization.hpp │ ├── Symbol.cpp │ ├── SymbolicExpression.cpp │ ├── SymbolicExpressionSerialization.hpp │ ├── Utility.cpp │ ├── gtirb/ │ │ └── proto/ │ │ └── CMakeLists.txt │ └── test/ │ ├── Addr.test.cpp │ ├── Allocator.test.cpp │ ├── AuxData.test.cpp │ ├── AuxDataContainer.test.cpp │ ├── AuxDataContainerSchema.hpp │ ├── AuxDataSchemaRegistration.test.cpp │ ├── ByteInterval.test.cpp │ ├── CFG.test.cpp │ ├── CMakeLists.txt │ ├── CodeBlock.test.cpp │ ├── DataBlock.test.cpp │ ├── IR.test.cpp │ ├── 
Main.test.cpp │ ├── Main.test.hpp │ ├── MergeSortedIterator.test.cpp │ ├── Module.test.cpp │ ├── Node.test.cpp │ ├── Offset.test.cpp │ ├── PrepDeathTest.hpp │ ├── PrepTestGTIRB.cpp │ ├── ProxyBlock.test.cpp │ ├── Section.test.cpp │ ├── SerializationTestHarness.hpp │ ├── Symbol.test.cpp │ ├── SymbolicExpression.test.cpp │ ├── TestHelpers.hpp │ ├── TypedNodeTest.cpp │ ├── UtilsDeprecatedGlobals.test.cpp │ ├── UtilsUsingGtirbNamespace.test.cpp │ ├── config-test.h.in │ ├── runtests.cmake │ ├── testInputBinary/ │ │ ├── CMakeLists.txt │ │ └── TestInputBinary.cpp │ └── testInterop/ │ ├── CMakeLists.txt │ ├── test_floats.cpp │ ├── test_floats.py │ ├── test_variants.cpp │ └── test_variants.py └── version.txt ================================================ FILE CONTENTS ================================================ ================================================ FILE: .ci/Dockerfile.static ================================================ FROM ubuntu:20.04 ARG BOOST_VERSION=1_68_0 SHELL ["/bin/bash", "-c"] # Install apt packages RUN export DEBIAN_FRONTEND=noninteractive RUN ln -fs /usr/share/zoneinfo/America/New_York /etc/localtime RUN apt-get -y update && \ apt-get -y install \ autoconf \ build-essential \ clang \ clang-format \ cmake \ curl \ git \ libprotobuf-dev \ libprotoc-dev \ libtool \ protobuf-compiler \ unzip \ wget \ software-properties-common RUN TARBALL=boost_${BOOST_VERSION}.tar.bz2 && \ curl -L https://archives.boost.io/release/1.68.0/source/${TARBALL} \ -o /tmp/${TARBALL} --fail && \ tar xf /tmp/${TARBALL} --one-top-level=/tmp && \ cd /tmp/boost_${BOOST_VERSION} && \ ./bootstrap.sh --prefix=/usr/local && \ ./b2 include=/usr/include/python3.8 link=static install && \ cd / && \ rm -rf /tmp/${TARBALL} /tmp/boost_${BOOST_VERSION} ================================================ FILE: .ci/Dockerfile.ubuntu20 ================================================ FROM ubuntu:20.04 # Install apt packages ENV VIRTUAL_ENV=/opt/venv ENV PATH="$VIRTUAL_ENV/bin:$PATH" RUN 
apt-get -y update && \ DEBIAN_FRONTEND=noninteractive \ apt-get -y install \ autoconf \ build-essential \ clang \ clang-format \ cmake \ curl \ default-jdk \ doxygen \ elpa-paredit \ emacs-nox \ git \ graphviz \ libprotobuf-dev \ libprotoc-dev \ libtool \ libboost-dev \ maven \ protobuf-compiler \ python3 \ python3-pip \ python3-setuptools \ python3-venv \ wget \ software-properties-common \ sbcl \ slime && \ python3 -m venv $VIRTUAL_ENV && \ python3 -m pip install --upgrade pip # The default version of maven from the ubuntu repositories contains a bug that # causes warnings about illegal reflective accesses. The build on apache's # website fixes this bug, so we use that build instead. RUN wget https://archive.apache.org/dist/maven/maven-3/3.9.3/binaries/apache-maven-3.9.3-bin.tar.gz -P /tmp RUN tar xf /tmp/apache-maven-*.tar.gz -C /opt RUN update-alternatives --install /usr/bin/mvn mvn /opt/apache-maven-3.9.3/bin/mvn 392 # Install python dependencies COPY python/requirements-dev.txt /tmp/requirements-dev.txt RUN pip3 install -r /tmp/requirements-dev.txt ================================================ FILE: .ci/Dockerfile.ubuntu22 ================================================ FROM ubuntu:22.04 ENV VIRTUAL_ENV=/opt/venv ENV PATH="$VIRTUAL_ENV/bin:$PATH" RUN apt-get -y update && \ DEBIAN_FRONTEND=noninteractive \ apt-get -y install \ autoconf \ build-essential \ clang \ clang-format \ cmake \ curl \ default-jdk \ doxygen \ elpa-paredit \ emacs-nox \ git \ graphviz \ libprotobuf-dev \ libprotoc-dev \ libtool \ libboost-dev \ maven \ protobuf-compiler \ python3 \ python3-pip \ python3-setuptools \ python3-venv \ wget \ software-properties-common \ sbcl \ slime && \ python3 -m venv $VIRTUAL_ENV && \ python3 -m pip install --upgrade pip COPY python/requirements-dev.txt /tmp/requirements-dev.txt RUN pip3 install -r /tmp/requirements-dev.txt ================================================ FILE: .ci/Dockerfile.ubuntu24 ================================================ 
FROM ubuntu:24.04 ENV VIRTUAL_ENV=/opt/venv ENV PATH="$VIRTUAL_ENV/bin:$PATH" RUN apt-get -y update && \ DEBIAN_FRONTEND=noninteractive \ apt-get -y install \ autoconf \ build-essential \ clang \ clang-format \ cmake \ curl \ default-jdk \ doxygen \ elpa-paredit \ emacs-nox \ git \ graphviz \ libprotobuf-dev \ libprotoc-dev \ libtool \ libboost-dev \ # As of 24.04.1 LTS, the clang package depends on libstdc++-13-dev but # appears to be compiled for libstdc++-14-dev, which we need to install # explicitly here. libstdc++-14-dev \ maven \ protobuf-compiler \ python3 \ python3-pip \ python3-setuptools \ python3-venv \ wget \ software-properties-common \ sbcl \ slime && \ python3 -m venv $VIRTUAL_ENV && \ python3 -m pip install --upgrade pip COPY python/requirements-dev.txt /tmp/requirements-dev.txt RUN pip3 install -r /tmp/requirements-dev.txt ================================================ FILE: .ci/PKGBUILD ================================================ # Contributor: Eric Schulte # Maintainer: Eric Schulte _srcname=gtirb pkgname=gtirb-git pkgver=v1.4.7.r0.gb3094954 pkgrel=1 pkgdesc="GrammaTech Intermediate Representation for Binaries" arch=('x86_64') url="https://github.com/grammatech/gtirb" license=('MIT') depends=('protobuf' 'python-networkx') makedepends=('git' 'cmake' 'python' 'doxygen' 'graphviz' 'boost') provides=('gtirb') source=('git://github.com/grammatech/gtirb.git') sha512sums=('SKIP') pkgver() { cd "$_srcname" git describe --long --tags --exclude "gt/*" | sed 's/\([^-]*-g\)/r\1/;s/[-:/ ]/./g' } build() { cd "$_srcname/" cmake . 
-Bbuild -DCMAKE_INSTALL_PREFIX=/usr -DGTIRB_CL_API=OFF \ -DCMAKE_BUILD_TYPE=${BUILD_TYPE-RelWithDebInfo} \ -DCMAKE_CXX_COMPILER=${COMPILER-g++} cmake --build build --target all doc } package() { cd "$_srcname/" make -Cbuild DESTDIR="$pkgdir" install mkdir -p "$pkgdir"/usr/share/doc/$_srcname cp -R build/doc/html/ "$pkgdir"/usr/share/doc/$_srcname } ================================================ FILE: .ci/adjust-coverage-paths.py ================================================ #!/usr/bin/env python3 import os from argparse import ArgumentParser from pathlib import Path from xml.etree import ElementTree parser = ArgumentParser( description=""" Adjusts the source paths in coverage.xml to satisfy GitLab's expectations. Specifically, it removes the build tree prefix from the sources and replaces it with the source tree prefix. These prefixes are determined via command-line arguments or CI environment variables. """ ) parser.add_argument( "coverage", metavar="coverage.xml", type=Path, help="path of cobertura coverage file to fix", ) group = parser.add_mutually_exclusive_group(required=True) group.add_argument( "-i", "--in-place", action="store_true", help="rewrite coverage in place" ) group.add_argument( "-o", "--output", metavar="file", help="write modified coverage to file" ) parser.add_argument( "--source-dir", metavar="path", default=os.environ.get("CI_PROJECT_DIR"), help="root of the GTIRB repository", ) parser.add_argument( "--build-dir", metavar="path", type=Path, help="path where coverage was run (default coverage.xml parent directory)", ) args = parser.parse_args() if args.source_dir is None: parser.error("either --source-dir or CI_PROJECT_DIR is required") args.source_dir = Path(args.source_dir).resolve() if args.build_dir is None: args.build_dir = args.coverage.parent args.build_dir = args.build_dir.resolve() et = ElementTree.parse(args.coverage) for source in et.iter("source"): if source.text: relpath = Path(source.text).relative_to(args.build_dir) fixed = 
str(Path(args.source_dir, relpath)) print("mapping", source.text, "to", fixed) source.text = fixed if args.output: et.write(args.output) else: et.write(args.coverage) ================================================ FILE: .ci/build.py ================================================ #!/usr/bin/env python import subprocess import sys import conanfile def run_conan(args): cmd = ["conan"] + args print("running: %s" % " ".join(cmd)) sys.stdout.flush() subprocess.check_call(cmd) def build(argv): props = conanfile.Properties() run_conan(["create", ".", props.conan_ref] + argv) archived_channels = props.archived_channels if props.conan_channel in archived_channels: run_conan( ["upload", props.conan_recipe, "--all", "--remote", "gitlab"] ) else: print( "Conan channel not archived. Update archived_branches in " "conanfile.py to get archival." ) print("archived channels: ") print(*archived_channels, sep=", ") print("channel built: " + props.conan_channel) if __name__ == "__main__": build(sys.argv[1:]) ================================================ FILE: .ci/gitlab-ci.yml ================================================ variables: # The IMAGE_TAG is derived from the branch name so that if a branch modifies # the CI images, it builds and runs using the new images without conflicting # with master. IMAGE_TAG: "$CI_COMMIT_REF_SLUG" GIT_SUBMODULE_STRATEGY: recursive EXTRA_INDEX_URL: https://__token__:$GL_PKG_API_TOKEN@git.grammatech.com/api/v4/projects/1587/packages/pypi/simple # The follow two variables are used by the package-uploader. PROJECT_ID: $CI_PROJECT_ID PIPELINE_ID: $CI_PIPELINE_ID CONAN_PASSWORD: $CI_JOB_TOKEN CONAN_VERSION: "1.59" # Limit build parallelism to avoid overwhelming CI servers. 
MAKE_JOBS: 8 stages: - build-images - prebuild - build - build-installers - test-setup - test-packages1 - test-packages2 - deploy - deploy-apt - upload default: tags: [shared] .build-ci-image: &build-ci-image stage: build-images image: name: quay.io/buildah/stable script: # Configure authentication credentials for GitLab - buildah login -u "$CI_REGISTRY_USER" -p "$CI_REGISTRY_PASSWORD" "$CI_REGISTRY" - buildah login -u "$DOCKERHUB_USERNAME" -p "$DOCKERHUB_PASSWORD" https://index.docker.io/v1/ # Build our image (using a cache if available) - >- buildah build -f "$CI_PROJECT_DIR/$DOCKERFILE_PATH" --cache-from "$DOCKER_REGISTRY/$CI_PROJECT_PATH/$IMAGE_NAME/cache" --cache-to "$DOCKER_REGISTRY/$CI_PROJECT_PATH/$IMAGE_NAME/cache" --layers --tag "$DOCKER_REGISTRY/$CI_PROJECT_PATH/$IMAGE_NAME:$IMAGE_TAG" "$CI_PROJECT_DIR" # Push to our internal registry - buildah push "$DOCKER_REGISTRY/$CI_PROJECT_PATH/$IMAGE_NAME:$IMAGE_TAG" # If we're on the master branch, also push the latest tag. - >- if [ "$CI_COMMIT_BRANCH" = "$CI_DEFAULT_BRANCH" ]; then buildah push "$DOCKER_REGISTRY/$CI_PROJECT_PATH/$IMAGE_NAME:$IMAGE_TAG" \ "$DOCKER_REGISTRY/$CI_PROJECT_PATH/$IMAGE_NAME:latest" fi build-ci-image-ubuntu20: <<: *build-ci-image variables: DOCKERFILE_PATH: .ci/Dockerfile.ubuntu20 IMAGE_NAME: ubuntu20 build-ci-image-ubuntu22: <<: *build-ci-image variables: DOCKERFILE_PATH: .ci/Dockerfile.ubuntu22 IMAGE_NAME: ubuntu22 build-ci-image-ubuntu24: <<: *build-ci-image variables: DOCKERFILE_PATH: .ci/Dockerfile.ubuntu24 IMAGE_NAME: ubuntu24 build-ci-image-static: <<: *build-ci-image variables: DOCKERFILE_PATH: .ci/Dockerfile.static IMAGE_NAME: static check-format: stage: prebuild image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu20:$IMAGE_TAG script: - |+ pre-commit run --all-files --show-diff-on-failure || ( (cat < cmake ../ -DCMAKE_BUILD_TYPE=$BUILD_TYPE -DCMAKE_CXX_COMPILER=${CXX_COMPILER:-g++} -DCPACK_DEBIAN_PACKAGE_RELEASE="$(lsb_release -sc)" 
-DENABLE_CODE_COVERAGE=${ENABLE_CODE_COVERAGE:-OFF} -DGTIRB_BUILD_SHARED_LIBS=${GTIRB_BUILD_SHARED_LIBS:-ON} -DGTIRB_PACKAGE_POLICY=$PACKAGE_POLICY -DGTIRB_RELEASE_VERSION=$RELEASE_VERSION -DGTIRB_STRIP_DEBUG_SYMBOLS=On -DGTIRB_CL_API=${GTIRB_CL_API:-OFF} -DGTIRB_CXX_API=${GTIRB_CXX_API:-OFF} -DGTIRB_JAVA_API=${GTIRB_JAVA_API:-OFF} -DGTIRB_PY_API=${GTIRB_PY_API:-OFF} - make -j${MAKE_JOBS} - ctest --output-on-failure build-ubuntu20-gcc: variables: IMAGE_NAME: 'ubuntu20' GTIRB_CXX_API: 'ON' CXX_COMPILER: 'g++' CPACK_GENERATOR: 'DEB' BUILD_TYPE: 'RelWithDebInfo' PACKAGE_POLICY: "unix" <<: *build build-ubuntu22-gcc: variables: IMAGE_NAME: 'ubuntu22' GTIRB_CXX_API: 'ON' CXX_COMPILER: 'g++' CPACK_GENERATOR: 'DEB' BUILD_TYPE: 'RelWithDebInfo' PACKAGE_POLICY: "unix" <<: *build build-ubuntu24-gcc: variables: IMAGE_NAME: 'ubuntu24' GTIRB_CXX_API: 'ON' CXX_COMPILER: 'g++' CPACK_GENERATOR: 'DEB' BUILD_TYPE: 'RelWithDebInfo' PACKAGE_POLICY: "unix" <<: *build build-ubuntu24-gcc-debug: variables: IMAGE_NAME: 'ubuntu24' GTIRB_CXX_API: 'ON' CXX_COMPILER: 'g++' BUILD_TYPE: 'Debug' PACKAGE_POLICY: "unix" <<: *build build-ubuntu24-clang-debug: variables: IMAGE_NAME: 'ubuntu24' GTIRB_CXX_API: 'ON' CXX_COMPILER: 'clang++' BUILD_TYPE: 'Debug' PACKAGE_POLICY: "unix" <<: *build build-static: variables: IMAGE_NAME: 'static' GTIRB_CXX_API: 'ON' CXX_COMPILER: 'g++' BUILD_TYPE: 'RelWithDebInfo' GTIRB_BUILD_SHARED_LIBS: 'OFF' <<: *build build-java: variables: IMAGE_NAME: 'ubuntu24' GTIRB_JAVA_API: 'ON' <<: *build build-lisp: variables: IMAGE_NAME: 'ubuntu20' GTIRB_CL_API: 'ON' <<: *build build-ubuntu20-python: variables: IMAGE_NAME: 'ubuntu20' GTIRB_PY_API: 'ON' <<: *build build-ubuntu24-python: variables: IMAGE_NAME: 'ubuntu24' GTIRB_PY_API: 'ON' <<: *build generate-coverage: variables: IMAGE_NAME: 'ubuntu24' BUILD_TYPE: 'Debug' CXX_COMPILER: 'g++' ENABLE_CODE_COVERAGE: 'ON' GTIRB_CXX_API: 'ON' GTIRB_PY_API: 'ON' artifacts: # Upload coverage reports and source for report-coverage-* jobs to 
use. paths: - build/**/*.gcno - build/**/*.gcda - build/python/.coverage* - build/**/*.py - build/**/*.h - build/**/*.cc - build/**/*.cpp before_script: - pip install "gcovr>=8.6" coverage <<: *build # > If there is more than one matched line in the job output, the last line is used # https://docs.gitlab.com/ee/ci/yaml/index.html#coverage # We output the two coverage numbers in separate jobs(report-coverage-*) so # that both can be reported to GitLab. report-coverage-cpp: stage: build needs: [generate-coverage] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG coverage: '/^TOTAL.*\s+(\d+\%)$/' script: - pip install "gcovr>=8.6" - cd build - gcovr --exclude=googletest-src --exclude=doc --exclude=..*/proto --exclude=..*/test --root .. report-coverage-py: stage: build needs: [generate-coverage] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG coverage: '/^TOTAL.*\s+(\d+\%)$/' artifacts: reports: coverage_report: coverage_format: cobertura path: build/python/coverage.xml script: - pip install -r python/requirements-dev.txt - cd build/python - tox run -e report - ../../.ci/adjust-coverage-paths.py --in-place coverage.xml --build-dir .. # The build artifact timestamps may be out-of-date relative to the newly cloned # repository for later jobs. These commands will update the timestamps to bring # them up to date without actually building much. This is significantly faster # than rebuilding out-of-date files in the later jobs. 
.update-artifact-timestamps: &update-artifact-timestamps - make -C build --touch python-wheel: stage: build-installers needs: [build-ubuntu24-python] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG artifacts: name: "$CI_COMMIT_REF_NAME-$CI_JOB_NAME" paths: - gtirb-*-py*-none-any.whl script: - *update-artifact-timestamps - pip3 wheel --no-deps build/python python-wheel-unstable: stage: build-installers needs: [python-wheel] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG rules: - if: '$CI_COMMIT_BRANCH == "master"' artifacts: name: "$CI_COMMIT_REF_NAME-$CI_JOB_NAME" paths: - gtirb-unstable-py3-none-any.whl script: - cp gtirb-*-py*-none-any.whl ./gtirb-unstable-py3-none-any.whl test-capstone-example: stage: test-packages1 image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG needs: ['build-ubuntu24-gcc'] script: - *update-artifact-timestamps - cd build - '[[ ! -f bin/ex-jumps ]]' - apt-get install -y libcapstone-dev - cmake .. - make -j${MAKE_JOBS} - '[[ -f bin/ex-jumps ]]' test-default-install: stage: test-packages1 image: $DOCKER_REGISTRY/rewriting/gtirb/$IMAGE_NAME:$IMAGE_TAG variables: IMAGE_NAME: 'ubuntu24' COMPILER: 'g++-9' needs: ['build-ubuntu24-gcc'] script: - *update-artifact-timestamps - make -C build install && rm -rf build - LD_LIBRARY_PATH=/usr/local/lib:$LD_LIBRARY_PATH .ci/test-install-all.sh test-default-install-static: stage: test-packages1 image: $DOCKER_REGISTRY/rewriting/gtirb/static:$IMAGE_TAG needs: ['build-static'] script: - *update-artifact-timestamps - '[ -e build/lib/libgtirb.a ]' - '[ ! -e build/lib/libgtirb.so ]' - make -C build install - rm -rf build - LD_LIBRARY_PATH=/usr/local/lib:$LD_LIBRARY_PATH .ci/test-install-static.sh test-install-different-prefix: stage: test-packages1 image: $DOCKER_REGISTRY/rewriting/gtirb/$IMAGE_NAME:$IMAGE_TAG variables: IMAGE_NAME: 'ubuntu24' COMPILER: 'g++-9' needs: ['build-ubuntu24-gcc'] script: - *update-artifact-timestamps - cmake . 
-B build -DCMAKE_INSTALL_PREFIX=/tmp/prefix - make -C build install - rm -rf build - > CPPFLAGS=-I/tmp/prefix/include LDFLAGS=-L/tmp/prefix/lib LD_LIBRARY_PATH=/tmp/prefix/lib .ci/test-install-all.sh test-install-with-destdir: stage: test-packages1 image: $DOCKER_REGISTRY/rewriting/gtirb/$IMAGE_NAME:$IMAGE_TAG variables: IMAGE_NAME: 'ubuntu24' COMPILER: 'g++-9' needs: ['build-ubuntu24-gcc'] script: - *update-artifact-timestamps - DESTDIR=/tmp/destdir make -C ./build install - > CPPFLAGS=-I/tmp/destdir/usr/local/include LDFLAGS=-L/tmp/destdir/usr/local/lib LD_LIBRARY_PATH=/tmp/destdir/usr/local/lib .ci/test-install-all.sh test-interop: stage: test-packages1 needs: ['build-ubuntu24-gcc', 'python-wheel'] image: ${DOCKER_REGISTRY}/rewriting/gtirb/ubuntu24:$IMAGE_TAG script: - *update-artifact-timestamps - pip3 install gtirb-*-py*-none-any.whl - .ci/test-interop.sh .conan-linux: &conan-linux stage: deploy needs: [check-format] image: $DOCKER_REGISTRY/rewriting/gtirb/$IMAGE_NAME:$IMAGE_TAG script: - python3 -m pip install --upgrade conan~=$CONAN_VERSION - conan profile new default --detect - conan profile update settings.compiler.libcxx=libstdc++11 default - conan remote add gitlab ${CI_API_V4_URL}/packages/conan - conan user ci_user -r gitlab -p - export PYTHONPATH="$(pwd)" - python3 .ci/build.py conan-linux-gcc9: variables: IMAGE_NAME: ubuntu20 <<: *conan-linux conan-linux-gcc11: variables: IMAGE_NAME: ubuntu22 <<: *conan-linux .conan-windows: &conan-windows stage: deploy needs: [check-format] tags: [ddisasm-windows] artifacts: name: "$CI_COMMIT_REF_NAME-$CI_JOB_NAME" paths: - gtirb*.zip script: # Setting CI_PROJECT_DIR to $(pwd) because CI doesn't properly set CI_PROJECT_DIR with VirtualBox runners. 
- export CI_PROJECT_DIR=`cygpath -w $(pwd)` # Initialize - systeminfo - python -m pip install --upgrade conan~=$CONAN_VERSION - export PYTHONPATH=$CI_PROJECT_DIR # Setup Remote and Authenticate - conan remote add gitlab ${CI_API_V4_URL}/packages/conan - conan user ci_user -r gitlab -p # Build - export GTIRB_DISABLE_PARALLEL_BUILD=1 - python .ci/build.py -s build_type=$BUILD_TYPE # Install # Python print() on Windows returns CRLF and will cause issues in CI - use "print('string', end='')" when outputting from python. - export PKG_INSTALL_NAME=`python -c "import conanfile; print(conanfile.Properties().conan_recipe, end='')"` - conan install $PKG_INSTALL_NAME -g deploy --build=missing --install-folder="./packages" # Package - export PKG_NAME=`conan inspect . --raw name` - export PKG_VERSION=`conan inspect . --raw version` - export PKG_ARCH=`uname -m` - cd ./packages # Library Package - export PKG_FILENAME="${CI_PROJECT_DIR}\\${PKG_NAME}-${PKG_VERSION}.win10.${PKG_ARCH}.zip" - export PKG_MANIFEST=( "gtirb/bin/gtirb.dll" "gtirb/licenses/LICENSE.txt" ) - zip -r $PKG_FILENAME ${PKG_MANIFEST[@]} # Development Package - export PKG_FILENAME_DEV="${CI_PROJECT_DIR}\\${PKG_NAME}-dev-${PKG_VERSION}.win10.${PKG_ARCH}.zip" - export PKG_MANIFEST_DEV=( "${PKG_MANIFEST[@]}" "gtirb/lib/gtirb.lib" "gtirb/include/gtirb" ) - zip -r $PKG_FILENAME_DEV ${PKG_MANIFEST_DEV[@]} conan-windows-debug: variables: BUILD_TYPE: Debug <<: *conan-windows conan-windows-release: variables: BUILD_TYPE: Release <<: *conan-windows conan-windows-32: stage: deploy tags: [ddisasm-windows] needs: [] variables: ARCHITECTURE: x64 script: - systeminfo - export PATH="C:\\Program Files\\Python38;$PATH" - export PYTHONPATH="$(cygpath -w $(pwd))" # Install conan - python -m pip install --upgrade conan~=$CONAN_VERSION # Setup Remote and Authenticate - conan remote add gitlab ${CI_API_V4_URL}/packages/conan - conan user ci_user -r gitlab -p # The boost options disable building boost with libiconv. 
This is important, because we can't get the package to build with --build=libiconv. - CI_PROJECT_DIR=$(cygpath -w $(pwd)) python .ci/build.py -s arch=x86 -s compiler.runtime=MT --build=protobuf -o protobuf:with_zlib=False --build=gtirb --build=boost -o boost:zlib=False -o boost:bzip2=False -o boost:without_locale=True -o boost:without_log=True --build=missing external-pypi: stage: deploy needs: [build-ubuntu24-gcc, python-wheel] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG rules: - if: '$CI_COMMIT_REF_NAME =~ /^release-.*/' script: - pip3 install twine wheel setuptools pkginfo --upgrade - pip3 install gtirb-*-py*-none-any.whl - GTIRB_VERSION=$(python3 -c "import gtirb; print(gtirb.__version__)") # We won't be releasing our dev packages externally, so fail if this is a # .dev package. - if [[ "$GTIRB_VERSION" =~ \.dev[[:digit:]]*(\+.*)?$ ]]; then exit 1; fi - twine check gtirb-*-py*-none-any.whl - twine upload gtirb-*-py*-none-any.whl -u __token__ -p $PYPI_API_KEY # On master, we only upload and overwrite `.dev` versions of the python # package. Non-.dev versions should only be uploaded on versioned # release-.* branches. This is so the versioning of our python packages # coincides with that of our conan packages, where dev packages are # produced from master, and stable, versioned packages are produced # on release-.* branches. 
internal-pypi: stage: deploy needs: [build-ubuntu24-gcc, python-wheel] image: python:3.9 rules: - if: '$CI_COMMIT_BRANCH == "master"' - if: '$CI_COMMIT_REF_NAME =~ /^release-.*/' script: - pip3 install twine wheel setuptools pkginfo --upgrade - wget https://git.grammatech.com/research/templates/python-module/raw/master/.pypirc - sed "s/password = /password = $GL_PKG_API_TOKEN/" .pypirc > ~/.pypirc - pip3 install gtirb-*-py*-none-any.whl - NEW_VERSION=$(python3 -c "import gtirb; print(gtirb.__version__)") - if [[ "$NEW_VERSION" =~ \.dev[[:digit:]]*(\+.*)?$ && "$CI_COMMIT_REF_NAME" =~ ^release-.* ]]; then exit 1; fi - if [[ "$CI_COMMIT_BRANCH" == "master" ]]; then if [[ ! "$NEW_VERSION" =~ \.dev[[:digit:]]*$ ]]; then echo "[ERROR] Only .dev versions can be uploaded from the master branch."; exit 1; fi; if pip3 install --extra-index-url=$EXTRA_INDEX_URL "gtirb>$NEW_VERSION" 2>/dev/null; then echo "[ERROR] The package version being published on master should always be >= the version in the repository."; exit 1; fi; wget https://git.grammatech.com/research/templates/python-module/raw/master/delete_remote_packages.py; python3 delete_remote_packages.py $GL_PKG_API_TOKEN gtirb-*-py*-none-any.whl; fi - twine check gtirb-*-py*-none-any.whl - twine upload --verbose --repository repypi gtirb-*-py*-none-any.whl # Apt packaging related jobs .build-ubuntu-packages: &build-ubuntu-packages stage: build-installers artifacts: name: "$CI_COMMIT_REF_NAME-$CI_JOB_NAME" paths: - build script: - pip3 install setuptools wheel --upgrade - cd build - cpack -G "DEB" -D CPACK_GTIRB_PACKAGE=debian-lib; - cpack -G "DEB" -D CPACK_GTIRB_PACKAGE=debian-dev; - cpack -G "DEB" -D CPACK_GTIRB_PACKAGE=debian-debug; build-ubuntu20-packages: needs: [build-ubuntu20-gcc] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu20:$IMAGE_TAG <<: *build-ubuntu-packages build-ubuntu22-packages: needs: [build-ubuntu22-gcc] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu22:$IMAGE_TAG <<: *build-ubuntu-packages 
build-ubuntu24-packages: needs: [build-ubuntu24-gcc] image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG <<: *build-ubuntu-packages .setup-test-apt-repo: &setup-test-apt-repo stage: test-setup artifacts: name: "$CI_COMMIT_REF_NAME-$CI_JOB_NAME" paths: - apt-repo script: - mkdir apt-repo - cp build/*.deb apt-repo - cd apt-repo && dpkg-scanpackages . /dev/null > Packages .test-ubuntu-libgtirb-dev: &test-ubuntu-libgtirb-dev stage: test-packages1 artifacts: name: "$CI_COMMIT_REF_NAME-$CI_JOB_NAME" paths: - test-install script: - echo -e "\ndeb [trusted=yes] file:$(pwd)/apt-repo ./\n" >> /etc/apt/sources.list - cat /etc/apt/sources.list - 'TEST_PKG_NAME=$(dpkg --info apt-repo/libgtirb-dev_*.deb | sed -n "s/Package: //p")' - apt-get update -y && apt-get install -y --allow-unauthenticated $TEST_PKG_NAME - cp .ci/test-install.cpp ./ - g++ test-install.cpp -std=c++17 -o test-install -lgtirb -lstdc++ - ./test-install .test-ubuntu-libgtirb: &test-ubuntu-libgtirb stage: test-packages2 script: - echo -e "\ndeb [trusted=yes] file:$(pwd)/apt-repo ./\n" >> /etc/apt/sources.list - 'TEST_PKG_NAME=$(dpkg --info apt-repo/libgtirb_*.deb | sed -n "s/Package: //p")' - apt-get update -y && apt-get install -y --allow-unauthenticated $TEST_PKG_NAME - ./test-install .test-ubuntu-libgtirb-dbg: &test-ubuntu-libgtirb-dbg stage: test-packages1 script: - echo -e "\ndeb [trusted=yes] file:$(pwd)/apt-repo ./\n" >> /etc/apt/sources.list - 'TEST_PKG_NAME=$(dpkg --info apt-repo/libgtirb-dbg_*.deb | sed -n "s/Package: //p")' - apt-get update -y && apt-get install -y --allow-unauthenticated $TEST_PKG_NAME - '[ -f /usr/lib/debug/.build-id/$(readelf -n /usr/lib/libgtirb.so | grep ''Build ID: '' | cut -d":" -f2 | sed -E ''s/ ([a-f0-9]{2,})([a-f0-9]{30,})/\1\/\2/g'').debug ];' setup-ubuntu20-test-apt-repo: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu20:$IMAGE_TAG needs: [build-ubuntu20-packages] <<: *setup-test-apt-repo setup-ubuntu22-test-apt-repo: image: 
$DOCKER_REGISTRY/rewriting/gtirb/ubuntu22:$IMAGE_TAG needs: [build-ubuntu22-packages] <<: *setup-test-apt-repo setup-ubuntu24-test-apt-repo: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG needs: [build-ubuntu24-packages] <<: *setup-test-apt-repo test-ubuntu20-libgtirb-dev: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu20:$IMAGE_TAG needs: [setup-ubuntu20-test-apt-repo] <<: *test-ubuntu-libgtirb-dev test-ubuntu22-libgtirb-dev: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu22:$IMAGE_TAG needs: [setup-ubuntu22-test-apt-repo] <<: *test-ubuntu-libgtirb-dev test-ubuntu24-libgtirb-dev: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG needs: [setup-ubuntu24-test-apt-repo] <<: *test-ubuntu-libgtirb-dev test-ubuntu20-libgtirb-dbg: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu20:$IMAGE_TAG needs: [setup-ubuntu20-test-apt-repo] <<: *test-ubuntu-libgtirb-dbg test-ubuntu22-libgtirb-dbg: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu22:$IMAGE_TAG needs: [setup-ubuntu22-test-apt-repo] <<: *test-ubuntu-libgtirb-dbg test-ubuntu24-libgtirb-dbg: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG needs: [setup-ubuntu24-test-apt-repo] <<: *test-ubuntu-libgtirb-dbg test-ubuntu20-libgtirb: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu20:$IMAGE_TAG needs: [setup-ubuntu20-test-apt-repo,test-ubuntu20-libgtirb-dev] <<: *test-ubuntu-libgtirb test-ubuntu22-libgtirb: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu22:$IMAGE_TAG needs: [setup-ubuntu22-test-apt-repo,test-ubuntu22-libgtirb-dev] <<: *test-ubuntu-libgtirb test-ubuntu24-libgtirb: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu24:$IMAGE_TAG needs: [setup-ubuntu24-test-apt-repo,test-ubuntu24-libgtirb-dev] <<: *test-ubuntu-libgtirb .debian-installer: &debian-installer stage: deploy artifacts: name: "$CI_COMMIT_REF_NAME-$CI_JOB_NAME" paths: - '*gtirb*.deb' script: - cp build/*gtirb*.deb ./ debian-installer-ubuntu20: image: $DOCKER_REGISTRY/rewriting/gtirb/ubuntu20:$IMAGE_TAG needs: [test-ubuntu20-libgtirb, 
build-ubuntu20-packages] <<: *debian-installer .apt-upload: &apt-upload stage: deploy-apt trigger: project: rewriting/utility/package-uploader strategy: depend apt-public-ubuntu20-unstable: <<: *apt-upload rules: - if: '$CI_COMMIT_BRANCH == "master"' variables: JOB_NAME: debian-installer-ubuntu20 APT_REPO: public APT_REPO_CODENAMES: focal APT_REPO_COMPONENT: unstable apt-public-ubuntu20-stable: <<: *apt-upload rules: - if: '$CI_COMMIT_REF_NAME =~ /^release-.*/' variables: JOB_NAME: debian-installer-ubuntu20 APT_REPO: public APT_REPO_CODENAMES: focal APT_REPO_COMPONENT: stable apt-internal-ubuntu20-unstable: <<: *apt-upload rules: - if: '$CI_COMMIT_BRANCH == "master"' variables: JOB_NAME: debian-installer-ubuntu20 APT_REPO: internal APT_REPO_CODENAMES: focal APT_REPO_COMPONENT: unstable apt-internal-ubuntu20-stable: <<: *apt-upload rules: - if: '$CI_COMMIT_REF_NAME =~ /^release-.*/' variables: JOB_NAME: debian-installer-ubuntu20 APT_REPO: internal APT_REPO_CODENAMES: focal APT_REPO_COMPONENT: stable maven-central-upload: stage: deploy needs: [build-java] trigger: project: rewriting/utility/package-uploader strategy: depend rules: - if: '$CI_COMMIT_REF_NAME == "master"' - if: '$CI_COMMIT_REF_NAME =~ /^release-.*/' variables: JOB_NAME: build-java JAVA_POM_SUBDIR: ./build/java .windows-upload: &windows-upload stage: upload trigger: project: rewriting/utility/package-uploader strategy: depend needs: [conan-windows-release] windows-upload-public: <<: *windows-upload rules: - if: '$CI_COMMIT_REF_NAME =~ /^release-.*/' - if: '$CI_COMMIT_REF_NAME == "master"' variables: JOB_NAME: conan-windows-release FILESERVER: public FILESERVER_SUBDIR_NAME: windows-release windows-upload-internal: <<: *windows-upload rules: - if: '$CI_COMMIT_REF_NAME =~ /^release-.*/' - if: '$CI_COMMIT_REF_NAME == "master"' variables: JOB_NAME: conan-windows-release FILESERVER: internal FILESERVER_SUBDIR_NAME: windows-release wheel-upload-public: stage: upload trigger: project: 
rewriting/utility/package-uploader strategy: depend needs: [python-wheel-unstable] rules: - if: '$CI_COMMIT_REF_NAME == "master"' variables: JOB_NAME: python-wheel-unstable FILESERVER: public FILESERVER_SUBDIR_NAME: python ================================================ FILE: .ci/pre-commit ================================================ #!/bin/bash OUTPUT=$(git clang-format --diff) if [ "${OUTPUT}" == "no modified files to format" ] || [ "${OUTPUT}" == "clang-format did not modify any files" ];then exit 0 else echo "Run git clang-format, then commit." exit 1 fi ================================================ FILE: .ci/test-install-all.sh ================================================ #!/bin/sh -e set -o xtrace set -o nounset set -o errexit builddir=$(pwd) workdir=`mktemp -d` trap 'cd / ; rm -rf $workdir' EXIT cd $workdir # Compile and run a C++ file that links to libgtirb cp $builddir/.ci/test-install.cpp ./ make CXXFLAGS=-std=c++17 LDLIBS=-lgtirb test-install ./test-install ================================================ FILE: .ci/test-install-static.sh ================================================ #!/bin/sh -e set -o xtrace set -o nounset set -o errexit builddir=$(pwd) workdir=`mktemp -d` trap 'cd / ; rm -rf $workdir' EXIT cd $workdir # Compile and run a C++ file that links to libgtirb statically cp $builddir/.ci/test-install.cpp ./ make 'CXXFLAGS=-std=c++17' 'LDLIBS=-lgtirb -lgtirb_proto -lprotobuf -lpthread' test-install ./test-install ================================================ FILE: .ci/test-install.cpp ================================================ #include #include #include int main() { auto filename = std::tmpnam(nullptr); std::ofstream ofs{filename, std::ios_base::binary}; auto ctx1 = gtirb::Context(); auto ir1 = gtirb::IR::Create(ctx1); ir1->save(ofs); ofs.close(); std::ifstream ifs{filename, std::ios_base::binary}; auto ctx2 = gtirb::Context(); if (auto ir2 = gtirb::IR::load(ctx2, ifs)) { return ir2.get()->modules().empty() ? 
0 : 1; }; return 1; } ================================================ FILE: .ci/test-install.lisp ================================================ (in-package :gtirb) (uiop/stream:with-temporary-file (:pathname path :keep nil) (let ((it (make-instance 'gtirb)) (test-string "Something.")) (push (cons "test" (make-instance 'aux-data)) (aux-data it)) (setf (aux-data-type (cdar (aux-data it))) :string (aux-data-data (cdar (aux-data it))) test-string) (write-gtirb it path) (assert (string= (aux-data-data (cdar (aux-data (read-gtirb path)))) test-string) (path) "AuxData in GTIRB at ~s holds ~s." path test-string))) ================================================ FILE: .ci/test-install.py ================================================ import sys import tempfile import gtirb filename = tempfile.mktemp() ir = gtirb.IR() ir.save_protobuf(filename) ir = gtirb.IR.load_protobuf(filename) sys.exit(len(ir.modules)) ================================================ FILE: .ci/test-interop.sh ================================================ #!/bin/bash set -e cd build failures=0 check() { local creator=$1 local auxdata=$2 local consumer=$3 shift 3 if "$@" ; then echo $creator $auxdata AuxData work in $consumer else failures=$(( failures + 1)) fi } ### floating-point compatiblity test bin/test_floats -w floats_cpp.gtirb python3 src/test/testInterop/test_floats.py -w floats_py.gtirb check python float c++ \ bin/test_floats -r floats_py.gtirb check c++ float python \ python3 src/test/testInterop/test_floats.py -r floats_cpp.gtirb rm floats_{cpp,py}.gtirb ### variant compatibility test bin/test_variants -w variants_cpp.gtirb python3 src/test/testInterop/test_variants.py -w variants_py.gtirb check c++ variant python \ python3 src/test/testInterop/test_variants.py -r variants_cpp.gtirb check python variant c++ \ bin/test_variants -r variants_py.gtirb rm variants_{cpp,py}.gtirb test $failures = 0 ================================================ FILE: .clang-format 
================================================ --- Language: Cpp # BasedOnStyle: LLVM AccessModifierOffset: -2 AlignAfterOpenBracket: Align AlignConsecutiveAssignments: false AlignConsecutiveDeclarations: false AlignEscapedNewlinesLeft: false AlignOperands: true AlignTrailingComments: true AllowAllParametersOfDeclarationOnNextLine: true AllowShortBlocksOnASingleLine: false AllowShortCaseLabelsOnASingleLine: false AllowShortFunctionsOnASingleLine: All AllowShortIfStatementsOnASingleLine: false AllowShortLoopsOnASingleLine: false AlwaysBreakAfterDefinitionReturnType: None AlwaysBreakAfterReturnType: None AlwaysBreakBeforeMultilineStrings: false AlwaysBreakTemplateDeclarations: false BinPackArguments: true BinPackParameters: true BraceWrapping: AfterClass: false AfterControlStatement: false AfterEnum: false AfterFunction: false AfterNamespace: false AfterObjCDeclaration: false AfterStruct: false AfterUnion: false BeforeCatch: false BeforeElse: false IndentBraces: false BreakBeforeBinaryOperators: None BreakBeforeBraces: Attach BreakBeforeTernaryOperators: true BreakConstructorInitializersBeforeComma: false BreakAfterJavaFieldAnnotations: false BreakStringLiterals: true ColumnLimit: 80 CommentPragmas: '^ IWYU pragma:' ConstructorInitializerAllOnOneLineOrOnePerLine: false ConstructorInitializerIndentWidth: 4 ContinuationIndentWidth: 4 Cpp11BracedListStyle: true DerivePointerAlignment: false DisableFormat: false ExperimentalAutoDetectBinPacking: false ForEachMacros: [ foreach, Q_FOREACH, BOOST_FOREACH ] # IncludeBlocks: Regroup IncludeCategories: - Regex: '^".*"' Priority: 1 - Regex: '^.container" field, despite # what the Context Availability documentation says. 
See: # https://docs.github.com/en/actions/learn-github-actions/contexts#context-availability - id: vars run: | export IMAGE_TAG=$([ "${{ github.ref_name }}" == "master" ] && echo latest || echo ${{ github.ref_name }} | sed -e "s/\//-/g") echo "image_tag=$IMAGE_TAG" >> $GITHUB_ENV echo "image_tag=$IMAGE_TAG" >> $GITHUB_OUTPUT export IMAGE_PATH=$(echo ghcr.io/${{ github.repository }}/ | awk '{print tolower($0)}') echo "image_path=$IMAGE_PATH" >> $GITHUB_ENV echo "image_path=$IMAGE_PATH" >> $GITHUB_OUTPUT - uses: actions/checkout@master - name: Build image env: image_reference: ${{ env.image_path }}${{ matrix.os }} run: | buildah login -u ${{ github.actor }} -p ${{ secrets.GITHUB_TOKEN }} ghcr.io buildah build \ -f .ci/Dockerfile.${{ matrix.file_suffix }} \ --cache-from ${{ env.image_reference }}-cache \ --cache-to ${{ env.image_reference }}-cache \ --layers \ --tag ${{ env.image_reference }}:${{ env.image_tag }} buildah push ${{ env.image_reference }}:${{ env.image_tag }} docs: runs-on: ubuntu-latest permissions: packages: read strategy: matrix: os: [focal] needs: docker container: ${{ needs.docker.outputs.image_path }}${{ matrix.os }}:${{ needs.docker.outputs.image_tag }} steps: - name: Checkout uses: actions/checkout@v3 - name: Generate documentation run: | cmake -DGTIRB_ENABLE_TESTS=OFF -B build . cd build/python pip install -e '.[doc]' cd .. cmake .. 
make doc mv doc/html ../public - name: Upload GitHub Pages artifact uses: actions/upload-pages-artifact@v3 with: path: public deploy-pages: needs: docs if: github.ref == 'refs/heads/master' permissions: pages: write id-token: write environment: name: github-pages url: ${{ steps.deployment.outputs.page_url }} runs-on: ubuntu-latest steps: - name: Deploy to GitHub Pages id: deployment uses: actions/deploy-pages@v4 ================================================ FILE: .gitignore ================================================ *~ *.fasl *.o *.out *.pc out.gtir CMakeCache.txt CMakeFiles CMakeScripts Testing Makefile cmake_install.cmake install_manifest.txt compile_commands.json CTestTestfile.cmake build/ build-doc/ bin/ doc/html/ googletest-download/ googletest-src/ gsl-download/ gsl-src/ include/gsl/ include/proto/ wiki/ scratch.lisp /include/gtirb/version.h /java/com/grammatech/gtirb/proto/ .mypy_cache/ __pycache__/ .vscode/ .gtirb.pdf ================================================ FILE: .gtirb.tex ================================================ \begin{tikzpicture}%% Caption: GrammaTech IR for Binaries is a data structure that implicitly represents binary structures required for modification. Elements postifxed with "(1)" are singleton in any IR instance every other structure can appear in multiple. Every elements is assigned a Universal Unique Identifier (UUID) which can be used to reference the element from an AuxData table. AuxData tables hold open-ended analysis results. 
%% #fig:gtirb [ object/.style = {draw}, owner/.style = {thick}, owner-many/.style = {-triangle 90 reversed,thick}, reference/.style = {owner, dashed, ->}, ] \node[object, ] (ir) {IR (1)}; \node[object, below right=1em and 2em of ir, text width=6.25em] (ad0) {AuxData}; \node[below=0.25em of ad0.south] (ad1) {ID1 \& DATA1}; \node[below=0em of ad1] (ad2) {ID2 \& DATA2}; \node[below=0em of ad2] (ad3) {ID3 \& DATA3}; \node[below=0em of ad3] (ad4) {\ldots{}}; \node[fit={(ad1) (ad4)}, draw, thick, dotted, inner sep=0.25em] (auxdata) {}; \node[right=2em of auxdata] (anything) {{\em any UUID}}; \node[object, above right=4.5em and 2em of ir] (cfg) {CFG (1)}; \node[object, right=4em of cfg, text width=5em] (edges) {Edges}; \node[object, right=4em of ir, text width=6em] (modules) {Modules}; \node[object, below right=1em and 4em of modules, text width=6em] (symbols) {Symbols}; \node[object, right=4em of modules, text width=6em] (sections) {Sections}; \node[object, right=2em of sections, text width=8em] (byteintervals) {ByteIntervals}; \node[object, above=2em of byteintervals, text width=8em] (proxies) {Proxy blocks}; \node[object, right=2.5em of proxies, text width=7em] (codeblocks) {Code Blocks}; \node[object, below=0.5em of codeblocks, text width=7em] (datablocks) {Data Blocks}; \node[fit={(proxies) (codeblocks)}, draw, thick, dotted] (edgeblocks) {}; \node[] at (edges -| proxies) (eblocks) {Edge Blocks}; \node[fit={(codeblocks) (datablocks)}, draw, thick, dotted, inner sep=0.75em] (byteblocks) {}; \node[] at (eblocks -| byteblocks) (bblocks) {Byte Blocks}; \node[object, below right=1em and 2.5em of byteintervals, text width=10.5em] (symexpr) {SymbolicExpressions}; %% References \draw[reference] (edges.east) |- (eblocks); \draw[reference] (edges.east) -| ++(2,1) -| (bblocks.north); \draw[reference] (symbols.east) -| ++(2,-1) -| (symexpr.south); \draw[reference] (auxdata) -- (anything); %% Ownership \draw[owner-many] (ir) -- (modules); \draw[owner] (ir) -- ++(1.0,0) |- (cfg); 
\draw[owner-many] (ir) -- ++(1.0,0) |- (ad0); \draw[owner-many] (cfg) -- (edges); \draw[owner-many] (modules) -- ++(1.5,0) |- (symbols); \draw[owner-many] (modules) -- (sections); \draw[owner-many] (modules) -- ++(1.5,0) |- (edgeblocks); \draw[owner-many] (modules.south) -- (ad0.north-|modules.south); \draw[owner-many] (sections) -- (byteintervals); \draw[owner-many] (byteintervals) -- ++(1.75,0) |- (symexpr); \draw[owner-many] (byteintervals) -- ++(1.75,0) |- (bblocks); %% Local Variables: %% mode: latex %% end: \end{tikzpicture} ================================================ FILE: .isort.cfg ================================================ # Settings are chosen to be compatible with black: # https://black.readthedocs.io/en/stable/the_black_code_style.html#how-black-wraps-lines # For details on each setting: # https://github.com/timothycrosley/isort/wiki/isort-Settings [settings] line_length=79 multi_line_output=3 include_trailing_comma=true force_grid_wrap=0 ================================================ FILE: .lisp-format ================================================ ;;;; -*- emacs-lisp -*- ;;;; ;;;; For information about how to use lisp-format see it's ;;;; documentation, which is available in a comment at the top of the ;;;; lisp-format script or, equivalently, in the README available at: ;;;; ;;;; https://github.com/eschulte/lisp-format ;;;; (mapc (lambda (dir) (add-to-list 'load-path dir)) (apply #'append (mapcar (lambda (pkg-glob) (cl-loop for path in (directory-files ;; Use quicklisp if the user has it setup. 
(if (getenv "QUICK_LISP") (concat (getenv "QUICK_LISP") "/dists/quicklisp/software/") ;; Search for the site-lisp path in load-path (add-to-list 'load-path "/usr/share/emacs25/site-lisp/elpa/") (add-to-list 'load-path "/usr/share/emacs/site-lisp/elpa/") (cl-loop for path in load-path if (and (string-match-p "site-lisp" path) (file-expand-wildcards (concat (file-name-as-directory path) "slime*"))) do (cl-return path))) t pkg-glob) if (file-directory-p path) collect path)) (list "slime*" "paredit*")))) (defun verbose-require (package) (unless (ignore-errors (require package)) (message "Failed to load the package '%S'." package) (message "Ensure %s is installed locally, and then edit your" package) (message "\"~/.lisp-formatrc\" file adding %s to your load path.\n" package) (message " (add-to-list 'load-path )\n" package) ;; After printing the messages require again to trigger the error. (require package))) (verbose-require 'slime) (verbose-require 'paredit) (set-default 'indent-tabs-mode nil) (pushnew 'untabify *lisp-format-fixers*) (defun fix-trailing-parens (start end &optional _arg) "Use `paredit-close-parenthesis' to fix trailing parens." 
(interactive (if current-prefix-arg (list (point-min) (point-max) current-prefix-arg) (list (region-beginning) (region-end) nil))) (let ((c (current-column))) (save-excursion (save-restriction (narrow-to-region (point-min) end) (goto-char start) (while (re-search-forward "^ *)" nil t) (forward-char -1) (paredit-close-parenthesis)))) (move-to-column c))) (pushnew 'fix-trailing-parens *lisp-format-fixers*) ;;; Syntax table extension for curry-compose-reader-macros (modify-syntax-entry ?\[ "(]" lisp-mode-syntax-table) (modify-syntax-entry ?\] ")[" lisp-mode-syntax-table) (modify-syntax-entry ?\{ "(}" lisp-mode-syntax-table) (modify-syntax-entry ?\} "){" lisp-mode-syntax-table) (modify-syntax-entry ?\« "(»" lisp-mode-syntax-table) (modify-syntax-entry ?\» ")«" lisp-mode-syntax-table) ;;; Specify indentation levels for specific functions. (mapc (lambda (pair) (put (first pair) 'lisp-indent-function (second pair))) '((make-instance 1) (if-let 1) (if-let* 1) (when-let 1) (when-let* 1) (defixture 1) (lambda-bind 1) (signals 1) (match 1) (start-case 1) (define-proto-backed-class 4) (register-groups-bind 2))) (defun define-feature-lisp-indent (path state indent-point sexp-column normal-indent) "Indentation function called by `lisp-indent-function' for define-feature." ;; (message "CALLED: %S" ;; (list 'define-feature-lisp-indent ;; path state indent-point sexp-column normal-indent)) (cond ((equalp path '(2)) 2) ; Doc string for enclosing define-feature. ((equalp path '(3)) 2) ; Extractor function definition. ((equalp path '(3 2)) 4) ; Doc string for extractor. ((equalp path '(4)) 2) ; Merge function definition. (t nil))) ; Otherwise do the default. 
(put 'define-feature 'lisp-indent-function 'define-feature-lisp-indent) ================================================ FILE: .pre-commit-config.yaml ================================================ repos: - repo: https://github.com/psf/black rev: 22.3.0 hooks: - id: black args: ["--line-length", "79"] - id: black name: black (.pyi) args: ["--line-length", "79"] types: [pyi] - repo: local hooks: - id: clang-format name: clang-format language: system files: \.(c|h|cpp|hpp|proto|java)$ entry: clang-format -i - repo: https://github.com/eschulte/lisp-format rev: master hooks: - id: lisp-format name: lisp-format args: [-style=file] - repo: https://github.com/pre-commit/pre-commit-hooks rev: v2.4.0 hooks: - id: end-of-file-fixer - id: trailing-whitespace args: ["--chars"," \t"] - id: check-merge-conflict - id: check-yaml args: [--allow-multiple-documents] - id: debug-statements - id: mixed-line-ending - repo: https://github.com/iconmaster5326/cmake-format-pre-commit-hook rev: v0.6.2 hooks: - id: cmake-format exclude: build - repo: https://github.com/timothycrosley/isort rev: 5.13.2 hooks: - id: isort files: \.py$ - repo: https://github.com/PyCQA/flake8 rev: 7.1.0 hooks: - id: flake8 ================================================ FILE: AlignOf.cmake ================================================ macro(ALIGNOF TYPE LANG NAME) if(NOT ALIGNOF_${NAME}) # # Try to compile and run a foo grogram. 
The alignment result will be stored # in ALIGNOF_${NAME}
#include // Define your own custom AuxData tables. // By convention, we put these in the namespace gtirb::schema. // // Note that if the custom type requires custom serialization, a // specialization of the auxdata_traits template also has to be // provided. We provide default specializations for many standard // types. namespace gtirb { namespace schema { struct MyAuxDataFoo { static constexpr const char* Name = "foo"; typedef Foo Type; }; } } using namespace gtirb; using namespace schema; // Register AuxData types before using GTIRB. void call_me_from_main() { AuxDataContainer::registerAuxDataType(); AuxDataContainer::registerAuxDataType(); } void do_stuff_with_gtirb() { Context C; IR& ir = *IR::Create(C); ir.addModule(Module::Create(C)); Module& module = *ir.modules_begin(); // Attach an empty alignment table to the internal representation module.addAuxData(std::map{}); //... // Create a new block Section* section = module.addSection(C, ".text"); ByteInterval* interval = section->addByteInterval(C, Addr(400), 1000); CodeBlock* b1 = interval->addBlock(C, 64, 6); // Record that the block should be aligned to 8-byte boundaries. // First fetch the map AuxData. auto* align_map = module.getAuxData(); // Check for null if you don't know that the module definitely has // an existing Alignment AuxData attached. if (align_map) (*align_map)[b1->getUUID()] = 8; // Attach a custom "Foo" object. // Note that AuxData uses a move reference Foo my_foo = BuildAFoo(); module.addAuxData(std::move(my_foo)); // Subsequently access the Foo table through the AuxData interface. module.getAuxData()->some_member_function(); } ``` ## Sanctioned AuxData Tables The following are the sanctioned AuxData table schemata. 
| Label | Type | |-------------------------------------------|----------------------------------------------------| | [`"elfDynamicInit"`](#elfDynamicInit) | ```gtirb::UUID``` | | [`"elfDynamicFini"`](#elfDynamicFini) | ```gtirb::UUID``` | | [`"elfSoname"`](#elfSoname) | ```std::string``` | | [`"elfStackExec"`](#elfStackExec) | ```bool``` | | [`"elfStackSize"`](#elfStackSize) | ```uint64_t``` | | [`"functionBlocks"`](#functionblocks) | ```std::map>``` | | [`"functionEntries"`](#functionentries) | ```std::map>``` | | [`"functionNames"`](#functionnames) | ```std::map``` | | [`"types"`](#types) | ```std::map``` | | [`"alignment"`](#alignment) | ```std::map``` | | [`"comments"`](#comments) | ```std::map``` | | [`"symbolForwarding"`](#symbolforwarding) | ```std::map``` | | [`"padding"`](#padding) | ```std::map``` | ### elfDynamicInit | | | |----------|----------------------------------------------------| | Label | ```"elfDynamicInit"``` | | Type | ```gtirb::UUID``` | | Value | CodeBlock UUID | | AttachedTo | gtirb::Module | | Note | The CodeBlock to which a DT_INIT entry in an ELF file's .dynamic section refers. | ### elfDynamicFini | | | |----------|----------------------------------------------------| | Label | ```"elfDynamicFini"``` | | Type | ```gtirb::UUID``` | | Value | CodeBlock UUID | | AttachedTo | gtirb::Module | | Note | The CodeBlock to which a DT_FINI entry in an ELF file's .dynamic section refers. | ### elfSoname | | | |----------|----------------------------------------------------| | Label | ```"elfSoname"``` | | Type | ```std::string``` | | Value | The SONAME of a library. | | AttachedTo | gtirb::Module | | Note | The string value which the DT_SONAME entry in an ELF file's .dynamic section contains. | ### elfStackExec | | | |----------|----------------------------------------------------| | Label | ```"elfStackExec"``` | | Type | ```bool``` | | Value | Stack executable flag specified by PT_GNU_STACK segment in ELF files. 
| | AttachedTo | gtirb::Module | ### elfStackSize | | | |----------|----------------------------------------------------| | Label | ```"elfStackSize"``` | | Type | ```uint64_t``` | | Value | The size of the PT_GNU_STACK segment in ELF files, which may influence the runtime stack size in certain environments. | | AttachedTo | gtirb::Module | ### functionBlocks | | | |----------|----------------------------------------------------| | Label | ```"functionBlocks"``` | | Type | ```std::map>``` | | Key | Function UUID. | | Value | The set of UUIDs of all the blocks (gtirb::CodeBlock) in the function. | | AttachedTo | gtirb::Module | | Note | This table identifies all of the gtirb::CodeBlocks that belong to each function. These do not necessarily have to be contiguous in the address space. Note that there is no function notion in the core GTIRB IR. A function's UUID is just a unique identifier that is consistently used across all function-related AuxData tables. | ### functionEntries | | | |----------|----------------------------------------------------| | Label | ```"functionEntries"``` | | Type | ```std::map>``` | | Key | Function UUID. | | Value | The set of UUIDs of all the entry blocks (gtirb::CodeBlock) for the function. | | AttachedTo | gtirb::Module | | Note | This table identifies all gtirb::CodeBlocks that represent entry points to each function. A single function may have more than one entry point. Note that there is no function notion in the core GTIRB IR. A function's UUID is just a unique identifier that is consistently used across all function-related AuxData tables. | ### functionNames | | | |----------|---------------------------------------------------------------------| | Label | ```"functionNames"``` | | Type | ```std::map``` | | Key | Function UUID. | | Value | The UUID of a gtrb::Symbol whose `name` field contains the name of the function. 
| | AttachedTo | gtirb::Module | | Note | There may be more than one gtirb::Symbol associated with the address(es) corresponding to the entry point(s) of a function. This table identifies a canonical gtirb::Symbol to be used for each function. Note that there is no function notion in the core GTIRB IR. A function's UUID is just a unique identifier that is consistently used across all function-related AuxData tables. | ### types | | | |----------|-----------------------------------------| | Label | ```"types"``` | | Type | ```std::map``` | | Key | The gtirb::UUID of a gtirb::DataBlock. | | Value | The type of the data, expressed as a std::string containing a C++ type specifier. | | AttachedTo | gtirb::Module | | Note | An entry in this table indicates that the given gtirb::DataBlock contains content that exhibits the given C++ type. | ### alignment | | | |----------|-----------------------------------------------------------| | Label | ```"alignment"``` | | Type | ```std::map``` | | Key | The gtirb::UUID of a gtirb::CodeBlock, gtirb::DataBlock, or gtirb::Section. | | Value | Alignment requirements for the block/data object/section. | | AttachedTo | gtirb::Module | | Note | An entry in this table indicates that the given object's address is required to be evenly divisible by the alignment value. Typically the alignment value is a power of 2. | ### comments | | | |----------|--------------------------------------------| | Label | ```"comments"``` | | Type | ```std::map``` | | Key | The gtirb::Offset of a comment. | | Value | A comment string relevant to the specified offset in the specified GTIRB entry. | | AttachedTo | gtirb::Module | | Note | The gtirb::Offset refers to the UUID of an entity in memory and a byte offset within that entity to indicate the point at which the comment applies. Comments can contain arbitrary content and are likely generated by analysis tools. They often do not (but may) represent comments present in the original source code of the binary. 
| ### symbolForwarding | | | |----------|----------------------------------------------| | Label | ```"symbolForwarding"``` | | Type | ```std::map``` | | Key | The gtirb::UUID of the "from" gtirb::Symbol. | | Value | The gtirb::UUID of the "to" gtirb::Symbol. | | AttachedTo | gtirb::Module | | Note | This table is intended to support cross-module references. A "from" symbol in one gtirb::Module may be dynamically bound at runtime to the "to" symbol in another gtirb::Module, thereby modeling dynamic library runtime linkage. | ### padding | | | |----------|------------------------------------------------| | Label | ```"padding"``` | | Type | ```std::map``` | | Key | The gtirb::Offset at which padding is present. | | Value | The length of the padding, in bytes. | | AttachedTo | gtirb::Module | | Note | Padding here may be 0's or it may be valid instructions. An entry in this table indicates that an analysis has determined that at the given gtirb::Offset (UUID of an entity in memory and byte offset into that entity) and length of bytes indicated constitute content that is unused by the program and is only present to ensure alignment of neighboring objects. Note: some disassemblers may still create a gtirb::CodeBlock or gtirb::DataBlock for the same portion of address space that a padding entry covers. | ## Provisional AuxData Tables The following are the provisional AuxData table schemata. 
| Label | Type | |-------------------------------------------------------------|--------------------------------------------------------------------------------------------------------------| | [`"binaryType"`](#binarytype) | ```std::vector``` | | [`"cfiDirectives"`](#cfidirectives) | ```std::map, gtirb::UUID>>>``` | | [`"elfSymbolInfo"`](#elfsymbolinfo) | ```std::map>``` | | [`"elfSymbolVersions"`](#elfsymbolversions) | ```std::tuple, uint16_t>>, std::map>, std::map>>``` | | [`"encodings"`](#encodings) | ```std::map``` | | [`"functionNameProbabilities"`](#functionnameprobabilities) | ```std::map>>>``` | | [`"includedLibraryNames"`](#includedlibrarynames) | ```std::map``` | | [`"includedLibraryVersions"`](#includedlibraryversions) | ```std::map``` | | [`"libraries"`](#libraries) | ```std::vector``` | | [`"libraryPaths"`](#librarypaths) | ```std::vector``` | | [`"peExportEntries"`](#peexportentries) | ```std::vector>``` | | [`"peExportedSymbols"`](#peexportedsymbols) | ```std::vector``` | | [`"peImportEntries"`](#peimportentries) | ```std::vector>``` | | [`"peImportedSymbols"`](#peimportedsymbols) | ```std::vector``` | | [`"peResource"`](#peresource) | ```std::vector, gtirb::Offset, uint64_t>>``` | | [`"profile"`](#profile) | ```std::map``` | | [`"prototypeTable"`](#prototypetable) | ```std::map``` | | [`"sccs"`](#sccs) | ```std::map``` | | [`"sectionProperties"`](#sectionproperties) | ```std::map>>>``` | | [`"symbolicExpressionSizes"`](#symbolicexpressionsizes) | ```std::map``` | | [`"typeTable"`](#typetable) | ```std::map, std::tuple, uint64_t, uint64_t, std::tuple>, gtirb::UUID, std::tuple, tuple>>, std::tuple, gtirb::UUID>>``` | ### encodings | | | |----------|------------------------------------------------| | Label | ```"encodings"``` | | Type | ```std::map``` | | Key | The gtirb::UUID of a data object. | | Value | The encoding of the data object. 
| | AttachedTo | gtirb::Module | | Note | Map from (typed) data objects to the encoding of the data, expressed as a std::string containing an assembler encoding specifier: "string", "uleb128" or "sleb128". | ### elfSymbolVersions | | | |----------|------------------------------------------------| | Label | ```"elfSymbolVersions"``` | | Type | ```std::tuple, uint16_t>>, std::map>, std::map>>``` | | Key | The gtirb::UUID of a section. | | Value | The tuple with the ELF section types and flag. | | AttachedTo | gtirb::Module | | Note | Tuple with symbol version definitions, needed symbol versions, and a mapping of symbol UUIDs to symbol versions. Symbol version definitions are `ElfSymDefs = std::map>, uint16_t>`, a map from symbol version identifiers version definitions. These correspond to `ELFxx_Verdef` entries in the ELF section `.gnu.version_d`. The values in the map are tuples containing the list of versions strings and the verdef flags. The verdef flag may be `VER_FLG_BASE` (0x1), which indicates that the given version definiton is the file itself, and must not be used for matching a symbol. The first element of the list is the version itself, the subsequent elements are predecessor versions. The needed symbol versions are `ElfSymVerNeeded = std::map>`, a map from dynamic library names to the symbol versions that they need. For each library, we have a map from version identifiers to version strings. Finally, symbol UUIDs are mapped to symbol versions as `ElfSymbolVersionsEntries = std::map>`, where the `bool` represents the `HIDDEN` attribute. Symbol version identifiers are `SymbolVersionId = uint16_t` integers. | ### cfiDirectives | | | |----------|------------------------------------------------| | Label | ```"cfiDirectives"``` | | Type | ```std::map, gtirb::UUID>>>``` | | Key | The gtirb::Offset of a cfi directive. 
| | Value | cfi directive contains: a string describing the directive, a vector of numeric arguments, and an optional symbolic argument (represented with the UUID of the symbol | | AttachedTo | gtirb::Module | | Note | Map from Offsets to vector of cfi directives. A cfi directive contains: a string describing the directive, a vector of numeric arguments, and an optional symbolic argument (represented with the UUID of the symbol). | ### elfSymbolInfo | | | |----------|------------------------------------------------| | Label | ```"elfSymbolInfo"``` | | Type | ```std::map>``` | | Key | The gtirb::UUID of a symbol. | | Value | The type, binding, and visibility categories of the symbol. | | AttachedTo | gtirb::Module | | Note | On ELF targets only: Map from symbols to their type, binding, and visibility categories. | ### libraries | | | |----------|------------------------------------------------| | Label | ```"libraries"``` | | Type | ```std::vector``` | | Value | The name of a library. | | AttachedTo | gtirb::Module | | Note | Names of the external libraries that are needed dynamically at run time. | ### libraryPaths | | | |----------|------------------------------------------------| | Label | ```"libraryPaths"``` | | Type | ```std::vector``` | | Value | A path contained in the rpath of the binary. | | AttachedTo | gtirb::Module | | Note | Paths contained in the rpath of the binary. | ### binaryType | | | |----------|------------------------------------------------| | Label | ```"binaryType"``` | | Type | ```std::vector``` | | Value | A binary type descriptor. | | AttachedTo | gtirb::Module | | Note | A set of binary type descriptors e.g. for ELF whether the binary is PIE "DYN" or not, "EXEC". PE binaries have additional descriptors, "DLL" or "EXE, and subsystem descriptor, e.g. WINDOWS_GUI or WINDOWS_CUI. 
| ### SCCs | | | |----------|------------------------------------------------| | Label | ```"SCCs"``` | | Type | ```std::map``` | | Key | The gtirb::UUID of a block | | Value | The intra-procedural SCC identifier of the block. | | AttachedTo | gtirb::Module | | Note | The intra-procedural SCC identifier of each block. | ### symbolicExpressionSizes | | | |----------|------------------------------------------------| | Label | ```"symbolicExpressionSizes"``` | | Type | ```std::map``` | | Key | The gtirb::Offset of a symbolic expression. | | Value | The size of the expression, in bytes. | | AttachedTo | gtirb::Module | | Note | Map from an Offset of a symbolic expression in a ByteInterval to its extent, a size in bytes. | ### peImportEntries | | | |----------|------------------------------------------------| | Label | ```"peImportEntries"``` | | Type | ```std::vector>``` | | Value | A tuples containing details of an imported function. | | AttachedTo | gtirb::Module | | Note | List of tuples detailing an imported function address, ordinal, function name, and library names for PE. | ### peExportEntries | | | |----------|------------------------------------------------| | Label | ```"peExportEntries"``` | | Type | ```std::vector>``` | | Value | A tuples containing details of an exported function. | | AttachedTo | gtirb::Module | | Note | List of tuples detailing an exported address, ordinal, and name for PE. | ### peImportedSymbols | | | |----------|------------------------------------------------| | Label | ```"peImportedSymbols"``` | | Type | ```std::vector``` | | Value | gtirb::UUID of an imported symbol. | | AttachedTo | gtirb::Module | | Note | UUIDs of the imported symbols for PE. | ### peExportedSymbols | | | |----------|------------------------------------------------| | Label | ```"peExportedSymbols"``` | | Type | ```std::vector``` | | Value | gtirb::UUID of an exported symbol. | | AttachedTo | gtirb::Module | | Note | UUIDs of the exported symbols for PE. 
| ### peResource | | | |----------|------------------------------------------------| | Label | ```"peResource"``` | | Type | ```std::vector, gtirb::Offset, uint64_t>>``` | | Value | A resource header, data length, and data pointer. | | AttachedTo | gtirb::Module | | Note | List of PE resources. A resource header, data length, and data pointer. | ### profile | | | |----------|----------------------------------------------------------| | Label | ```"profile"``` | | Type | ```std::map``` | | Key | The gtirb::UUID of a gtirb::CodeBlock. | | Value | The number of times that block was executed. | | AttachedTo | gtirb::Module | | Notes | An entry in this table describes how many times a code block was executed. Blocks that are not present in this aux data table should be assumed to have a value of 0, indicating that they were not executed. | ### functionNameProbabilities | | | |------------|-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------| | Label | ```"functionNameProbabilities"``` | | Type | ```std::map>>>``` | | Key | Name of the tool that made the predictions. | | Value | Map from function UUID to a list of weighted predictions. Each prediction is a tuple of where the score's meaning is tool dependent. Several existing tools use the convention that higher score is a better match and values ranging from 0.0 to 1.0. | | AttachedTo | gtirb::Module | | Notes | Used to collect results from tools that identify functions and their source libraries. Source library information is tracked in [includedLibraryNames](#includedlibrarynames) and [includedlibraryVersions](#includedlibraryversions). | ### includedLibraryNames | | | |------------|------------------------------------------| | Label | ```"includedLibraryNames"``` | | Type | ```std::map``` | | Key | Included library UUID. 
| | Value | The name of the library. | | AttachedTo | gtirb::Module | | Notes | Names of libraries that are included in an executable (i.e., their code is intermingled with the executable code). | ### includedlibraryVersions | | | |------------|-----------------------------------------------------------------------------------------------------------------------| | Label | ```"includedLibraryVersions"``` | | Type | ```std::map``` | | Key | Included library UUID. | | Value | Version string for the included library. | | AttachedTo | gtirb::Module | | Notes | Versions of libraries that are included in an executable (i.e., their code is intermingled with the executable code). | ### sectionProperties | | | |----------|------------------------------------------------| | Label | ```"sectionProperties"``` | | Type | ```std::map>>>``` | | Key | The gtirb::UUID of a section. | | Value | The tuple with the ELF section types and flag. | | AttachedTo | gtirb::Module | | Note | Map from section UUIDs to tuples with the ELF section types and flags. | ### typeTable | | | |------------|-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------| | Label | ```"typeTable"``` | | Type | ```std::map, std::tuple, uint64_t, uint64_t, std::tuple>, gtirb::UUID, std::tuple, tuple>>, std::tuple, gtirb::UUID>>``` | | Key | UUID of the type object | | Value | Variant of the object type, where the variants field each represent: Unknown, Bool, Int, Char, Float, Function, Pointer, Array, Struct, Void, Alias, in that order. | | AttachedTo | gtirb::Module | | Notes | Contains structured type information about objects in the variant. 
Some empty tuples have been replaced with ```std::tuple<int8_t>``` which is default-initialized to zero since some GTIRB implementations cannot store a 0-length tuple. The corresponding semantics of each type's variant field are the following:
- **Unknown**: ```uint64_t``` - Size of the unknown type
- **Bool**: ```std::tuple<int8_t>``` - default initialized to zero
- **Int**: ```std::tuple<int8_t, uint64_t>``` - A tuple of signedness (1 for signed, 0 for unsigned) and width of int
- **Char**: ```uint64_t``` - Size of the character
- **Float**: ```uint64_t``` - size of the floating point number
- **Function**: ```std::tuple<gtirb::UUID, std::vector<gtirb::UUID>>``` - A tuple of return type UUID, and a list of parameter type UUIDs
- **Pointer**: ```gtirb::UUID``` - UUID of pointed-to type
- **Array**: ```std::tuple<gtirb::UUID, uint64_t>``` - A tuple of the UUID of the elements of the array, and the number of elements in that array
- **Alias**: ```gtirb::UUID``` - The type being aliased (note this is effectively a `typedef`)
- **Struct**: ```std::tuple<uint64_t, std::vector<std::tuple<uint64_t, gtirb::UUID>>>``` - A tuple of the size of the structure in total, and a vector of its fields. Each field is represented as a tuple of the offset at which the field is located, and the UUID of the type of that field.
- **Void**: ```std::tuple``` - default initialized to zero | ### prototypeTable | | | |------------|--------------------------------------------| | Label | ```"prototypeTable"``` | | Type | ```std::map``` | | Key | UUID of the function | | Value | UUID of the function type in the typeTable | | AttachedTo | gtirb::Module | | Notes | Maps functions' UUIDs to their associated typeTable entry for the purpose of giving them prototypes. NOTE: The associated type table entry **must** be a Function type object. | ================================================ FILE: CHANGELOG.md ================================================ # 2.3.2 (Unreleased) # 2.3.1 * Fix auxdata table `elfSectionProperties` to `sectionProperties` in the java api to match the cpp and python api * Switched to use tox for testing the python API. # 2.3.0 * Fixed a compatibility problem in the Python API that prevented using recent releases of protobuf. The Python API on PyPI now requires protobuf 4.21.1 or newer. * Building the Python API now requires protobuf compiler version 3.19 or later for the generated definitions to be compatible with recent protobuf packages. The API can still be built with older protobuf compilers, but the result will not be compatible with recent protobuf packages. * Added support in the C++ API for deserializing set AuxData into unordered_sets. * Fixed issue causing compile errors when building with Boost 1.86+. * Building the C++ API now requires Boost 1.68 or later. * Fixed an obscure build error caused by a missing protobuf compiler. CMake now explicitly checks for the protobuf compiler before generating build files. # 2.2.0 * Move the following utility functions into the `gtirb` namespace: `alignAddr`, `alignmentAdjustment`, `BumpPtrAllocator`, `isPowerOf2_64`, `SpecificBumpPtrAllocator`, `cast`, `cast_or_null`, `dyn_cast`, `dyn_cast_or_null`, `isa`. 
For backwards compatibility, these functions remain available, but deprecated, in the global namespace unless `GTIRB_WRAP_UTILS_IN_NAMESPACE` is defined. # 2.1.0 * Stop generating debian metapackages and packages with the version attached to the package name. Updates in the apt-repository now support multiple package versions and upgrading `gtirb` with `apt-get upgrade`. * Fix performance issue when checking references of ProxyBlocks in Python API. * Add elfSoname AuxData definition * ByteInterval's blocks' sort order is now thoroughly defined: offset, size, kind, decode mode, and UUID. Adjusting these properties during iteration may cause blocks to be skipped or visited twice. * Added ByteInterval methods to the Python API to look up blocks by offset on. # 2.0.0 * The Java API has been substantially reworked. Including: * Most of the core API classes now have a more polished interface. * The API for handling AuxData has been completely redesigned. * New testing infrastructure based on JUnit5 has been added. * More extensive test cases have been added. * Add elfStackExec and elfStackSize AuxData definitions * Add `IR.modules_named` helper method to Python API. * Add `IR.findModules(String name)` helper method to Java API. # 1.12.0 * Add elfDynamicInit and elfDynamicFini AuxData definitions # 1.11.0 Note that this release, due to changes to the protobuf definitions of symbolic expression attributes, is backwards-incompatible with previous GTIRB files. * Replace symbolic expression attributes with composable labels. # 1.10.9 * Added support for bool values in AuxData. * Added elfSymbolVersions provisional AuxData definition. * The GTIRB file format has changed to include a prefix containing a "magic" identifier and the GTIRB protobuf version number to allow easier id of GTIRB files. The change is not backwards compatible. Newer versions of GTIRB will not be able to load older GTIRB files. * Converted the decode mode from an arbitrary integer into a ProtoBuf enum. 
This obviously breaks compatibility with older GTIRB files. # 1.10.8 * Ubuntu 18 and gcc7 are no longer supported. # 1.10.7 * Added support for floating-point numbers in AuxData. * Disabled testing the Python API using `setup.py test`. The tests can still be run using ctest or Python's unittest module. * Improved the performance of the Python API's ByteBlock.references property. * Fixed a pair of bugs in C++ support for variants in AuxData # 1.10.6 * Added type annotations to python API and made them available in package. * Removed install-python target. # 1.10.5 * Added various symbolic expression attributes. * Updated Java API # 1.10.4 * Removed SymStackConst support * Added variant (union) support for AuxData * Removed address and size from modules * Modified Module::findSections(string) to return a range instead of iterator * Added IR::findSection(string) to C++ API # 1.10.3 * Added offset helpers to Python API * Better support for `std::byte` when working with `ByteInterval` * Fixed a bug which manifested when serializing a big-endian IR # 1.10.2 * Updated "address" iteration order to compare size if addresses are the same and UUIDs if addresses and sizes are the same so that it can be used to store objects in ordered containers. * Fixed some bugs where modifying an object's address or size would cause findNodeOn to return incorrect results. * Improved performance of findNodeOn and findNodeAt queries. # 1.10.1 * Added module-level endianess flag, for use in archtectures with multiple possible endians for its code blocks. * Introduce iteration helpers cfgPredecessors and cfgSuccessors. # 1.9.0 * Introduce attributes for symbolic expressions to the core IR. * Reduce asymptotic complexity of iterating over blocks in a large number of byte intervals. * Fixed bug where searching for blocks by address could return incorrect matches. * Fixed bug where `ByteInterval::addBlock` would refuse to move an existing block to a new offset if it was already present. 
# 1.8.5 * Make Python Offset objects immutable and make Offsets equivalent when they refer to the same displacement from the same element. # 1.8.4 * Fix bug where Symbol iteration could get out of order when symbols refer to blocks in byte intervals that are relocated. # 1.8.3 * Fix bug that didn't add CodeBlocks to the CFG if the CodeBlocks were added to a ByteInterval before it was added to the IR. # 1.8.2 * The C++ API build no longer generates a `libgtirb.so.1` symlink. This has the effect of requiring clients to link against the full version number (e.g., `libgtirb.so.1.8.2`) to ensure ABI compatibility while we continue to make rapid improvements to the library. # 1.5.0 * In the Python API: * Removed `Node.from_uuid` and added `get_by_uuid` to `IR`s. This changes UUID lookup from a global cache to a per-IR cache; this means you can now have two IRs exist that share UUIDs but have different contents, for example. * Added convienience properties to all node types to find the parent nodes they belong to. # 1.4.6 * Implement std::hash for Addr objects. # 1.4.5 * Explicitly disable copy and move constructors for the Node class hierarchy in C++. This avoids a class of errors where nodes cannot be found by Node::getByUUID. # 1.4.4 * Build/install libgtirb.so.1 symlink on linux. # 1.4.3 * Remove the python-egg cmake target, add the python-wheel cmake target # 1.4.2 * Don't use __declspec(dllimport) on Windows. # 1.4.1 * Add ISA enums for PPC64, ARM64, MIPS32, and MIPS64. # 1.3.2 * Access functions for converting to/from protobuf are no longer public in the C++ API. * The proto library is no longer dllexported. * GTIRB_EXPORT_API no longer uses dllimport on the client side. # 1.3.1 * No longer installs Python files by default. Added a new 'install-python' target to install Python files. # 1.3.0 * Added a new field to symbols, `at_end`, which allows symbols to point to the end of their referents as well as the beginning. 
# 1.2.1 * Moved protobuf definitions into gtirb.proto package (gtirb::proto namespace in C++). * Installing the Python API now respects CMAKE_INSTALL_PREFIX and DESTDIR with their usual semantics. # 1.2.0 * AuxData and AuxDataContainer in the C++ API have been reworked to provide cleaner type safety. * AuxData is now retrieved directly from an AuxDataContainer using a schema class that specifies both the name of the AuxData object as well as its type. * Schemata for AuxData types must be registered at process startup before GTIRB objects are constructed or unserialized. # 1.1.1 * Fixed a bug where changing the address of a block caused lookups of symbol by address to fail in some cases. # 1.1.0 * Added a new API for accessing GTIRB, written in Java. This API is not yet released, and as such, has missing features, is not yet documented, and may change at any time. For more information, look at the contents of the `java` directory. # 1.0.0 This is a major backwards-incompatible release. The protobuf specification has changed significantly resulting in protobuf version 1 which is now tracked in `version.txt` in the base of this repository. (The original protobuf version was version 0.) The changes in this release are primarily intended to enable *binary rewriting* use cases on GTIRB. Other changes to the protobuf specification are for more general cleanup, simplification, and clarification. In addition, a new Common Lisp GTIRB API is now included along with the C++ and Python APIs. A list of specific changes follows. Complete documentation of all new objects and structures is provided in the GTIRB manual. * A `version` field is now present on GTIRB IR instances. The value of this field is now `1`. The old value of `0` is the protobuf default for a missing field. * The control flow graph (CFG) is now a child of the IR instead of living under a specific module. This means that a multi-module IR now has a single pan-module CFG. 
* The `Block` object has been renamed to `CodeBlock` and the `DataObject` to `DataBlock`. * A new object has been added to the GTIRB `Section`s named `ByteInterval`s. This replaces the `ByteMap` in the previous GTIRB version. A `ByteInterval` has: * An *optional* fixed address indicating its location in memory. Without an address the location of the `ByteInterval` is not specified allowing it to float to enable easier binary rewriting. * A `size` specifying the extend of the `ByteInterval` in memory. If this size is larger than the contents of the `ByteInterval` then the extension of the `ByteInterval` in memory beyond the end of the contents is un-allocated. * A byte vector named `contents` holding the contents of the `ByteInterval`. * A map from offsets to symbolic expressions. * A list of blocks holding `CodeBlock`s and `DataBlock`s. * The `address` field has been removed from `Block`s. * The `address` and `size` fields have been removed from `Section`s. * An offset from the start of their `ByteInterval` have been added to blocks. * The following fields have been removed from `Module`s: * `image_byte_map` * `symbolic_operands` * `blocks` and * `data`. * An entry point stored as a `CodeBlock` has been added to `Module`s. * A list of `ByteIntervals` has been added to `Section`s. * The `ISAID` enumeration on module is renamed to `ISA`. * Instead of an `AuxDataContainer` object we now hold a `map` on modules and IRs. * The following GTIRB enumerations are modified: `ISA`, `FileFormat`, `SymbolKind`, and `SectionFlag`. The goals of these modifications is to simplify the enumerations and ensure that all included options are both necessary and orthogonal. * Sections now include have `SectionFlag`s to store common properties such as `readable`, `writeable`, or `executable`. 
# 0.3.0 * You can now enable and disable the building of certain APIs when calling CMake, via the following flags: * `GTIRB_CXX_API` to control the building of the C++ API, on by default * `GTIRB_PY_API` to control the building of the Python API, on by default if `python3` is installed on your system * The following changes have been made to the Python API: * `Serialization.decode` can now take a `bytes` object in addition to a `BytesIO` object. * If an unknwon type is encountered while decoding `AuxData`, it will be placed in `data` as a `bytes`-like object instead of throwing a `DecodeError`. Unknown data decoded this way can be then encoded again. It is still an error to encode unknown types of auxdata not in the manner described above. * ImageByteMap::setData() has been extended to support arbitrary iterator types. * We now build documentation for the Python API using [Sphinx](https://www.sphinx-doc.org/en/master/). To generate all documentation locally, call `make doc` after calling `cmake`; this will generate both C++ and Python API documentation. To only make one or the other, call `make doxy` or `make sphinx`, respectively. * Making the Sphinx documentation will require the following Python packages: ```bash pip3 install sphinx sphinx-autodoc-typehints ``` # 0.2.0 * Added a new Python API, meant to be a high-level wrapper over the Protobuf-generated one. To make use of it, add the `python` folder from your build directory to your `PYTHONPATH`. The package is named `gtirb`. * CMake now won't automatically download and install its dependencies, so that the user has control over which versions are in use. The version requirements for Boost and Protobuf are listed in `README.md`. * Updated the sanctioned AuxData definitions. * Fix for build issue when using Boost 1.71.0. # 0.1.1 * Initial public release. 
================================================ FILE: CMakeLists.googletest ================================================ cmake_minimum_required(VERSION 2.8.2) project(googletest-download NONE) include(ExternalProject) externalproject_add( googletest GIT_REPOSITORY https://github.com/google/googletest.git GIT_TAG v1.15.2 SOURCE_DIR "${CMAKE_BINARY_DIR}/googletest-src" BINARY_DIR "${CMAKE_BINARY_DIR}/googletest-build" CONFIGURE_COMMAND "" BUILD_COMMAND "" INSTALL_COMMAND "" TEST_COMMAND "" ) ================================================ FILE: CMakeLists.txt ================================================ # # Cmake Configuration # # Need 3.10 to support CXX_STANDARD=17 and protobuf::protoc cmake_minimum_required(VERSION 3.10.0) # The version.txt file is the official record of the version number. We use the # contents of that file to set the project version for use in other CMake files. file(READ "${CMAKE_CURRENT_SOURCE_DIR}/version.txt" ver) string(REGEX MATCH "VERSION_MAJOR ([0-9]*)" _ ${ver}) set(GTIRB_MAJOR_VERSION ${CMAKE_MATCH_1}) string(REGEX MATCH "VERSION_MINOR ([0-9]*)" _ ${ver}) set(GTIRB_MINOR_VERSION ${CMAKE_MATCH_1}) string(REGEX MATCH "VERSION_PATCH ([0-9]*)" _ ${ver}) set(GTIRB_PATCH_VERSION ${CMAKE_MATCH_1}) string(REGEX MATCH "VERSION_PROTOBUF ([0-9]*)" _ ${ver}) set(GTIRB_PROTOBUF_VERSION ${CMAKE_MATCH_1}) cmake_policy(SET CMP0048 NEW) project( GTIRB VERSION "${GTIRB_MAJOR_VERSION}.${GTIRB_MINOR_VERSION}.${GTIRB_PATCH_VERSION}" ) set(PACKAGE_BRANCH master) include(CheckFunctionExists) include(CheckCXXSourceCompiles) include(CheckIncludeFile) include(Macros.cmake) include(AlignOf.cmake) include(CMakePackageConfigHelpers) option(ENABLE_CONAN "Use Conan to inject dependencies" OFF) if(ENABLE_CONAN) set(CONAN_SYSTEM_INCLUDES ON) include(${CMAKE_BINARY_DIR}/conanbuildinfo.cmake) conan_basic_setup() endif() # --------------------------------------------------------------------------- # Build options # 
--------------------------------------------------------------------------- set(GTIRB_MSVC_PARALLEL_COMPILE_JOBS "0" CACHE STRING "Number of parallel compiler jobs used for Visual Studio compiles. 0 means use all processors. Default is 0." ) option(GTIRB_ENABLE_TESTS "Enable building and running unit tests." ON) option(GTIRB_ENABLE_MYPY "Enable checking python types with mypy." ON) # This just sets the builtin BUILD_SHARED_LIBS, but if defaults to ON instead of # OFF. option(GTIRB_BUILD_SHARED_LIBS "Build shared libraries." ON) if(GTIRB_BUILD_SHARED_LIBS) set(BUILD_SHARED_LIBS ON) else() set(BUILD_SHARED_LIBS OFF) endif() if(UNIX AND NOT BUILD_SHARED_LIBS) # Find only static libraries set(CMAKE_FIND_LIBRARY_SUFFIXES ".a") add_compile_options(-static) endif() enable_testing() # Set ENABEL_CODE_COVERAGE to default off, unless you want to test c++ coverage option(ENABLE_CODE_COVERAGE "Build with instrumentation for collecting code coverage" OFF ) if(ENABLE_CODE_COVERAGE) if(${CMAKE_CXX_COMPILER_ID} STREQUAL GNU OR ${CMAKE_CXX_COMPILER_ID} STREQUAL Clang ) add_compile_options(--coverage) link_libraries(--coverage) else() message(FATAL_ERROR "no support for code coverage on this target") endif() endif() # Whether or not to run clang-tidy (if present) option(GTIRB_RUN_CLANG_TIDY "Enable running of clang-tidy." ON) # Define the cache variables for the API options. option(GTIRB_CXX_API "Whether or not the C++ API is built." ON) option(GTIRB_PY_API "Whether or not the Python API is built." ON) option(GTIRB_CL_API "Whether or not the Common Lisp API is built." ON) option(GTIRB_JAVA_API "Whether or not the Java API is built." ON) # Determine whether or not to strip debug symbols and set the build-id. This is # only really needed when we are building ubuntu *-dbg packages option(GTIRB_STRIP_DEBUG_SYMBOLS "Whether or not to strip debug symbols and set the build-id." OFF ) option( GTIRB_RELEASE_VERSION "Whether or not to build package versions without dev/SNAPSHOT suffixes. 
Applies to the python and java APIs." OFF ) # Determine whether or not the APIs are REALLY built or not. # === C++ === set(CXX_API ${GTIRB_CXX_API}) # === Python === set(PY_API ${GTIRB_PY_API}) if(GTIRB_PY_API) gtirb_find_python() if(PYTHON) set(PYTHON_MINIMUM_VERSION "3.6") if("${Python3_VERSION}" VERSION_LESS "${PYTHON_MINIMUM_VERSION}") message( WARNING "${PYTHON} --version is ${Python3_VERSION}, which is less than the minimum required, ${PYTHON_MINIMUM_VERSION}; disabling building of API." ) set(PY_API OFF) endif() else() message( WARNING "Python interpreter not found; disabling building of Python API. If this is in error, try giving -DPYTHON=... to CMake to specify what program to use." ) set(PY_API OFF) endif() endif() # === Common Lisp === # TODO: test the CL API on other CL interpreters and search for those in # addition to SBCL when looking for a default CL interpeter set(CL_API ${GTIRB_CL_API}) if(GTIRB_CL_API) find_program(LISP "sbcl") set(QUICKLISP "$ENV{HOME}/quicklisp" CACHE STRING "The Quicklisp installation to use." ) set(LISP_MINIMUM_VERSION "1.4.5") if(NOT LISP) message( WARNING "Lisp interpreter not found; disabling building of Lisp API. If this is in error, try giving -DLISP=... to CMake to specify what program to use." ) set(CL_API OFF) elseif(NOT EXISTS "${QUICKLISP}") message( WARNING "Quicklisp installation not found; disabling building of Lisp API. If this is in error, try giving -DQUICKLISP=... to CMake to specify what directory to use." ) set(CL_API OFF) else() execute_process(COMMAND "${LISP}" "--version" OUTPUT_VARIABLE LISP_VERSION) string(REPLACE "SBCL" "" LISP_VERSION "${LISP_VERSION}") string(REPLACE ".debian" "" LISP_VERSION "${LISP_VERSION}") if("${LISP_VERSION}" VERSION_LESS "${LISP_VERSION}") message( WARNING "${LISP} --version is ${LISP_VERSION}, which is less then the minimum required, ${LISP_MINIMUM_VERSION}; disabling building of API." 
) set(CL_API OFF) endif() endif() endif() # === Java === set(JAVA_API ${GTIRB_JAVA_API}) if(GTIRB_JAVA_API) find_package(Java 1.8.0 COMPONENTS Development) if(NOT JAVA_FOUND) message(WARNING "Java 8 compiler not found; disabling building of Java API. If this is in error, try setting the environment variable $JAVA_HOME." ) set(JAVA_API OFF) else() find_program(MVN mvn) if(NOT MVN) message( WARNING "Maven not found; disabling building of Java API. If this is in " "error, try setting -DMVN= on the CMake command-line" ) set(JAVA_API OFF) endif() endif() endif() # Documentation options. option(GTIRB_DOCUMENTATION "Whether or not documentation is built." ON) # --------------------------------------------------------------------------- # Global settings # --------------------------------------------------------------------------- set_property(GLOBAL PROPERTY USE_FOLDERS ON) set(CMAKE_MODULE_PATH ${CMAKE_CURRENT_SOURCE_DIR}/src) if(WIN32) set(CMAKE_DEBUG_POSTFIX "d" CACHE STRING "add a postfix, usually d on windows" ) endif() set(CMAKE_RELEASE_POSTFIX "" CACHE STRING "add a postfix, usually empty on windows" ) set(CMAKE_RELWITHDEBINFO_POSTFIX "" CACHE STRING "add a postfix, usually empty on windows" ) set(CMAKE_MINSIZEREL_POSTFIX "" CACHE STRING "add a postfix, usually empty on windows" ) set(CMAKE_ARCHIVE_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/lib) set(CMAKE_LIBRARY_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/lib) set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/bin) if(CXX_API) # Use C++17 set(CMAKE_CXX_STANDARD 17) # Error if it's not available set(CMAKE_CXX_STANDARD_REQUIRED ON) # Specifically check for gcc-7 or later. gcc-5 is installed on many systems # and will accept -std=c++17, but does not fully support the standard. 
if(CMAKE_CXX_COMPILER_ID STREQUAL "GNU") if(CMAKE_CXX_COMPILER_VERSION VERSION_LESS "7.0.0") message(FATAL_ERROR "gcc 7 or later is required to build gtirb") endif() endif() set(CMAKE_CXX_VISIBILITY_PRESET hidden) # # Global Options (Compile / Link) # add_compile_options(-DBOOST_MULTI_INDEX_DISABLE_SERIALIZATION) # MSVC-specific Options if(${CMAKE_CXX_COMPILER_ID} STREQUAL MSVC) if(NOT GTIRB_MSVC_PARALLEL_COMPILE_JOBS STREQUAL "1") if(GTIRB_MSVC_PARALLEL_COMPILE_JOBS STREQUAL "0") add_compile_options(-MP) message(STATUS "Parallel compilation enabled") else() add_compile_options(-MP${GTIRB_MSVC_PARALLEL_COMPILE_JOBS}) message( STATUS "Parallel compilation with ${GTIRB_MSVC_PARALLEL_COMPILE_JOBS} jobs" ) endif() else() message(STATUS "Parallel compilation disabled") endif() add_compile_options(-D_CRT_SECURE_NO_WARNINGS) add_compile_options(-D_MBCS) add_compile_options(-D_SCL_SECURE_NO_WARNINGS) # We need to add both so that there is not a mismatch between Win32 SDK # headers (which use UNICODE) and C Standard Library headers (which use # _UNICODE). add_compile_options(-D_UNICODE) add_compile_options(-DUNICODE) add_compile_options(-D_WIN32) # Disable macro definitions for min and max that conflict with the STL. add_compile_options(-DNOMINMAX) # Enable RTTI. FIXME: stop using typeid so we can disable this and add -fno- # rtti to the Clang/GCC compiler options. add_compile_options(-GR) # Enable exceptions, which are basically required because of our reliance on # boost. add_compile_options(-EHsc) # Enabled a sensible warning level and treat all warnings as errors. add_compile_options(-W4) add_compile_options(-WX) # Enable bigobj support, otherwise IR.cpp and Module.cpp will refuse to # compile due to execeeding the number of sections allowed in an object # file. FIXME: we should not have that many template instantiations. 
add_compile_options(-bigobj) add_compile_options(-sdl) # Enable extra security checks add_compile_options(-permissive-) # Disable permissive mode add_compile_options(-wd4996) # VC8: Deprecated libc functions. # This is a warning about a change in behavior from old versions of visual # c++. We want the new (standard-compliant) behavior, so we don't want the # warning. The warning is that using an array in a class initializer list # will cause its elements to be default initialized. add_compile_options(-wd4351) add_compile_options(-wd4146) # unary minus operator applied to unsigned # type, result still unsigned # C4505: 'google::protobuf::internal::MapField<...>::ContainsMapKey': # unreferenced local function has been removed add_compile_options(-wd4505) # C4267: protobuf-generated headers, at least w/ protobuf 3.9.1, trigger # MSVC's "conversion from 'size_t' to 'int', possible loss of data" warning. add_compile_options(-wd4267) # Release target options add_compile_options($<$:-GL>) # Enable whole program # optimization add_link_options($<$:-ltcg>) # Enable link-time code # generation elseif((${CMAKE_CXX_COMPILER_ID} STREQUAL GNU) OR (${CMAKE_CXX_COMPILER_ID} STREQUAL Clang) ) add_compile_options(-Wall -Wextra -Wpointer-arith -Wshadow -Werror) add_compile_options(-fPIC) endif() endif() # --------------------------------------------------------------------------- # Boost # --------------------------------------------------------------------------- if(CXX_API) find_package(Boost 1.68 REQUIRED) add_compile_options(-DBOOST_CONFIG_SUPPRESS_OUTDATED_MESSAGE) add_compile_options(-DBOOST_SYSTEM_NO_DEPRECATED) # Boost versions 1.70.0+ may use Boost's provided CMake support rather than # CMake's internal Boost support. The former uses "Boost::boost" and so on, # while the latter uses "Boost_BOOST" and so on. This normalizes the two cases # to use Boost_INCLUDE_DIRS and Boost_LIBRARIES. 
  # Normalize modern BoostConfig imported targets back to the classic
  # Boost_INCLUDE_DIRS variable consumed below.
  if(TARGET Boost::headers)
    get_target_property(
      Boost_INCLUDE_DIRS Boost::headers INTERFACE_INCLUDE_DIRECTORIES
    )
  endif()

  # SYSTEM suppresses warnings from Boost headers (we build with -Werror).
  include_directories(SYSTEM ${Boost_INCLUDE_DIRS})
endif()

# ---------------------------------------------------------------------------
# Google Test Application
# ---------------------------------------------------------------------------
if(GTIRB_ENABLE_TESTS AND CXX_API)
  # Pull in Google Test
  # https://github.com/google/googletest/tree/master/googletest#incorporating-
  # into-an-existing-cmake-project

  # Download and unpack googletest at configure time
  configure_file(CMakeLists.googletest googletest-download/CMakeLists.txt)
  execute_process(
    COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/googletest-download"
  )
  # A failed download is only a warning: tests will fail to build, but the
  # main configure can proceed.
  if(result)
    message(WARNING "CMake step for googletest failed: ${result}")
  endif()
  execute_process(
    COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/googletest-download"
  )
  if(result)
    message(WARNING "Build step for googletest failed: ${result}")
  endif()

  # Prevent overriding the parent project's compiler/linker settings on
  # Windows
  set(gtest_force_shared_crt
      ON
      CACHE BOOL "" FORCE
  )

  # Add googletest directly to our build. This defines the gtest and
  # gtest_main targets.
  add_subdirectory(
    "${CMAKE_BINARY_DIR}/googletest-src" "${CMAKE_BINARY_DIR}/googletest-build"
    EXCLUDE_FROM_ALL
  )
  include_directories("${gtest_SOURCE_DIR}/include")
endif()

# ---------------------------------------------------------------------------
# JUnit Test Application
# ---------------------------------------------------------------------------
# Fetch the JUnit console-standalone jar. The jar is used as-is, so all
# configure/build/install/test steps are disabled and extraction is skipped.
if(GTIRB_ENABLE_TESTS AND JAVA_API)
  include(ExternalProject)
  externalproject_add(
    junit
    PREFIX ${CMAKE_BINARY_DIR}/junit
    URL "https://repo1.maven.org/maven2/org/junit/platform/junit-platform-console-standalone/1.10.0/junit-platform-console-standalone-1.10.0.jar"
    CONFIGURE_COMMAND ""
    BUILD_COMMAND ""
    INSTALL_COMMAND ""
    TEST_COMMAND ""
    DOWNLOAD_NO_EXTRACT ON
  )
  # Path to the downloaded jar, for use by the java test targets.
  set(JUNIT_STANDALONE_JAR
      ${CMAKE_BINARY_DIR}/junit/src/junit-platform-console-standalone-1.10.0.jar
  )
endif()

# ---------------------------------------------------------------------------
# protobuf
# ---------------------------------------------------------------------------
# The Common Lisp bindings require a newer protobuf than the other APIs.
if(CL_API)
  find_package(Protobuf 3.7.0 REQUIRED)
else()
  find_package(Protobuf 3.0.0 REQUIRED)
endif()
if(NOT Protobuf_PROTOC_EXECUTABLE)
  # find_package only fails if the protobuf libraries or headers cannot be
  # found. It does not treat failing to find the protobuf compiler as an
  # error, so we do that explicitly here.
  message(
    FATAL_ERROR
      "Could not find Protobuf compiler 'protoc'. Please make sure the "
      "Protobuf compiler is installed."
  )
endif()

# Older protobuf needs an explicit bump of the serialized-message size limit.
if(Protobuf_VERSION VERSION_LESS 3.2)
  add_definitions(-DPROTOBUF_SET_BYTES_LIMIT)
endif()
if(NOT BUILD_SHARED_LIBS)
  set(Protobuf_USE_STATIC_LIBS ON)
endif()
include_directories(SYSTEM ${PROTOBUF_INCLUDE_DIRS})
add_subdirectory(proto)

# ---------------------------------------------------------------------------
# gtirb sources
# ---------------------------------------------------------------------------
# Each enabled API builds from its own subdirectory.
if(CXX_API)
  add_subdirectory(src)
endif()
if(PY_API)
  add_subdirectory(python)
endif()
if(CL_API)
  add_subdirectory(cl)
endif()
if(JAVA_API)
  add_subdirectory(java)
endif()
if(GTIRB_DOCUMENTATION)
  add_subdirectory(doc)
endif()

# ---------------------------------------------------------------------------
# Export config for use by other CMake projects
# ---------------------------------------------------------------------------
if(CXX_API)
  # --- For direct use from the build directory/cmake registry ---

  # This exports the targets
  export(TARGETS gtirb gtirb_proto
         FILE "${CMAKE_CURRENT_BINARY_DIR}/gtirbTargets.cmake"
  )

  # This is the main config file that find_package will look for.
  configure_file(
    "${CMAKE_CURRENT_LIST_DIR}/gtirbConfig.cmake.in"
    "${CMAKE_CURRENT_BINARY_DIR}/gtirbConfig.cmake" @ONLY
  )

  # Add the build directory to the user CMake registry, so find_package can
  # locate it automatically.
  export(PACKAGE gtirb)

  # --- For the installed copy ---

  # Main config file for find_package, includes the targets file and defines
  # the check_gtirb_branch function.
  if(NOT DEFINED PACKAGE_BRANCH)
    set(PACKAGE_BRANCH "No package branch specified")
  endif()

  # FIXME: The installed version of gtirbConfig currently contains the
  # check_gtirb_branch function, which requires users to explicitly call it.
  # We ought to move this functionality to gtirbConfig-version, so that
  # checking the gtirb version also checks the branch, requiring users to
  # opt-out of the branch check, rather than opt-in by calling
  # check_gtirb_branch.
  # See: GitLab issue #93
  configure_file(
    "${CMAKE_CURRENT_LIST_DIR}/gtirbConfig.cmake.in"
    "${CMAKE_CURRENT_BINARY_DIR}/export/gtirbConfig.cmake" @ONLY
  )

  # In this mode, find_package also seems to require a version file
  set(version_file "${CMAKE_CURRENT_BINARY_DIR}/gtirbConfig-version.cmake")
  write_basic_package_version_file(
    ${version_file}
    VERSION ${GTIRB_VERSION}
    COMPATIBILITY AnyNewerVersion
  )

  # Copy the config files to the install location
  install(
    FILES ${CMAKE_CURRENT_BINARY_DIR}/export/gtirbConfig.cmake ${version_file}
    DESTINATION lib/gtirb
    COMPONENT cmake_config
  )

  # This exports the targets to the install location.
  install(
    EXPORT gtirbTargets
    COMPONENT cmake_target
    DESTINATION lib/gtirb
  )
endif()

# ---------------------------------------------------------------------------
# Package policy enforcement
# ---------------------------------------------------------------------------
# PACKAGE_POLICY decides where license files are installed: an explicit user
# override wins, else "conan" for Conan/Windows builds, else "unix".
if(GTIRB_PACKAGE_POLICY)
  set(PACKAGE_POLICY ${GTIRB_PACKAGE_POLICY})
elseif(ENABLE_CONAN OR WIN32)
  set(PACKAGE_POLICY conan)
else()
  set(PACKAGE_POLICY unix)
endif()

if(PACKAGE_POLICY STREQUAL "unix")
  # Provides copyright file for Unix packages.
install( FILES ${CMAKE_SOURCE_DIR}/LICENSE.txt COMPONENT license DESTINATION share/doc/gtirb RENAME copyright ) elseif(PACKAGE_POLICY STREQUAL "conan") # Provides LICENSE.txt for Conan packages install( FILES ${CMAKE_SOURCE_DIR}/LICENSE.txt COMPONENT license DESTINATION licenses ) endif() # --------------------------------------------------------------------------- # Package generation with cpack # --------------------------------------------------------------------------- set(CPACK_PROJECT_CONFIG_FILE ${CMAKE_CURRENT_SOURCE_DIR}/cpack-config.cmake) set(CMAKE_PROJECT_HOMEPAGE_URL https://github.com/GrammaTech/gtirb) set(CPACK_PACKAGE_VERSION_MAJOR ${GTIRB_MAJOR_VERSION}) set(CPACK_PACKAGE_VERSION_MINOR ${GTIRB_MINOR_VERSION}) set(CPACK_PACKAGE_VERSION_PATCH ${GTIRB_PATCH_VERSION}) set(CPACK_PACKAGE_VENDOR "GrammaTech Inc.") set(CPACK_PACKAGE_CONTACT gtirb@grammatech.com) set(CPACK_PACKAGE_DESCRIPTION_FILE ${CMAKE_CURRENT_SOURCE_DIR}/README.md) set(CPACK_PACKAGE_RESOURCE_FILE_LICENSE ${CMAKE_CURRENT_SOURCE_DIR}/LICENSE.md) set(CPACK_PACKAGE_DESCRIPTION_SUMMARY "The GrammaTech Intermediate Representation for Binaries (GTIRB) is a machine code analysis and rewriting data structure." 
) set(CPACK_DEBIAN_PACKAGE_SECTION devel) string(REGEX MATCH "([^\.]+)\.([^\.]+)\.([^\.]+)" PROTOBUF_VERSION_MATCH ${Protobuf_VERSION} ) set(PROTOBUF_MAJOR_VERSION ${CMAKE_MATCH_1}) set(PROTOBUF_MINOR_VERSION ${CMAKE_MATCH_2}) set(PROTOBUF_PATCH_VERSION ${CMAKE_MATCH_3}) math(EXPR NEXT_PROTOBUF_PATCH "${PROTOBUF_PATCH_VERSION}+1") set(CPACK_PROTOBUF_VERSION_UPPER_BOUND "${PROTOBUF_MAJOR_VERSION}.${PROTOBUF_MINOR_VERSION}.${NEXT_PROTOBUF_PATCH}" ) set(CPACK_PROTOBUF_VERSION_LOWER_BOUND "${Protobuf_VERSION}") set(CPACK_GTIRB_VERSION "${GTIRB_VERSION}") set(CPACK_SOURCE_DIR ${CMAKE_SOURCE_DIR}) include(CPack) # --------------------------------------------------------------------------- # Report APIs and features built # --------------------------------------------------------------------------- message("APIs to be built:") message(" C++ ${CXX_API}") message(" Python ${PY_API}") message(" Lisp ${CL_API}") message(" Java ${JAVA_API}") ================================================ FILE: CODE_OF_CONDUCT.md ================================================ # Contributor Covenant Code of Conduct ## Our Pledge In the interest of fostering an open and welcoming environment, we as contributors and maintainers pledge to making participation in our project and our community a harassment-free experience for everyone, regardless of age, body size, disability, ethnicity, sex characteristics, gender identity and expression, level of experience, education, socio-economic status, nationality, personal appearance, race, religion, or sexual identity and orientation. 
## Our Standards Examples of behavior that contributes to creating a positive environment include: * Using welcoming and inclusive language * Being respectful of differing viewpoints and experiences * Gracefully accepting constructive criticism * Focusing on what is best for the community * Showing empathy towards other community members Examples of unacceptable behavior by participants include: * The use of sexualized language or imagery and unwelcome sexual attention or advances * Trolling, insulting/derogatory comments, and personal or political attacks * Public or private harassment * Publishing others' private information, such as a physical or electronic address, without explicit permission * Other conduct which could reasonably be considered inappropriate in a professional setting ## Our Responsibilities Project maintainers are responsible for clarifying the standards of acceptable behavior and are expected to take appropriate and fair corrective action in response to any instances of unacceptable behavior. Project maintainers have the right and responsibility to remove, edit, or reject comments, commits, code, wiki edits, issues, and other contributions that are not aligned to this Code of Conduct, or to ban temporarily or permanently any contributor for other behaviors that they deem inappropriate, threatening, offensive, or harmful. ## Scope This Code of Conduct applies within all project spaces, and it also applies when an individual is representing the project or its community in public spaces. Examples of representing a project or community include using an official project e-mail address, posting via an official social media account, or acting as an appointed representative at an online or offline event. Representation of a project may be further defined and clarified by project maintainers. ## Enforcement Instances of abusive, harassing, or otherwise unacceptable behavior may be reported by contacting the project team at gtirb-conduct@grammatech.com. 
All complaints will be reviewed and investigated and will result in a response that is deemed necessary and appropriate to the circumstances. The project team is obligated to maintain confidentiality with regard to the reporter of an incident. Further details of specific enforcement policies may be posted separately. Project maintainers who do not follow or enforce the Code of Conduct in good faith may face temporary or permanent repercussions as determined by other members of the project's leadership. ## Attribution This Code of Conduct is adapted from the [Contributor Covenant][homepage], version 1.4, available at https://www.contributor-covenant.org/version/1/4/code-of-conduct.html [homepage]: https://www.contributor-covenant.org For answers to common questions about this code of conduct, see https://www.contributor-covenant.org/faq ================================================ FILE: CONTRIBUTING.md ================================================ Contributing ============ ## Code of Conduct Please read the [GTIRB Code of Conduct](CODE_OF_CONDUCT.md). ## General Guidelines - Text files may not have trailing whitespace. - Text files must end with a trailing newline. - All tests should be able to run and pass. This can be checked by running `make check` on your build directory after running `cmake`. - All CMake files shall be formatted with [cmake-format](https://pypi.org/project/cmake-format/). A `.cmake-format` file is provided in the root directory for the project, and a pass through this tool is included as part of our `pre-commit` configuration (see below for details). - The GTIRB version saved in `version.txt` uses [semantic versioning](https://semver.org) - We also track a Protobuf version number in `version.txt` (as `VERSION_PROTOBUF`). 
This number is incremented whenever our protobuf files (under `proto/` in the GTIRB repository) are changed in any way that affects the serialized protobuf -- even if the change could potentially be backwards compatible because of the way protobuf gracefully handles unknown new fields. - We ask that all contributors complete our Contributor License Agreement (CLA), which can be found at [GrammaTech-CLA-GTIRB.pdf](./GrammaTech-CLA-GTIRB.pdf), and email the completed form to `CLA@GrammaTech.com`. Under this agreement contributors retain the copyright to their work but grants GrammaTech unlimited license to the work. ### pre-commit In general, code must follow a unified format. To make compliance with this format easier, we recommend the use of [`pre-commit`](https://pre-commit.com/) with the provided configuration file, `.pre-commit-config.yaml`, to manage formatting. To use `pre-commit`: 1. If `pre-commit` is not already installed on your system, install it now with [`pip`](https://pypi.org/project/pip/). ```shell pip3 install pre-commit ``` 2. If [`clang-format`](https://clang.llvm.org/docs/ClangFormat.html) is not already installed on your system, install it now. 3. Install the formatters as a pre-commit hook. In the gtirb root directory: ```shell pre-commit install ``` If you prefer to run `pre-commit` manually instead, run this before all commits: ```shell pre-commit run ``` ## C++ Code Requirements - All code shall be formatted with [clang-format](https://clang.llvm.org/docs/ClangFormat.html). A `.clang-format` is provided in the root directory for the project, and a pass through this tool is included as part of our `pre-commit` configuration. - Code should generally follow the C++ Core Guidelines recommendations. - Code should generally allow for thread safety. - No static variables. - No globals - Free functions should not maintain state. - Use caution when using iterators to guard against invalidation. - Maintain const-correctness. 
- Use UpperCamelCase for type names.
- Use UpperCamelCase for enum members.
- Use UpperCamelCase for variable and class members.
- Use lowerCamelCase for function and method names.
- Avoid `using namespace std`
- Use `auto` when the deduced type is explicitly spelled out in the
  initialization or if the deduced type is an abstract type alias. Always
  explicitly specify type qualifiers, pointers, and references. E.g.,
```cpp
const auto *Ptr = dynamic_cast<const SomeType *>(SomePtr);
auto Val = static_cast<SomeType>(SomeValue);
for (auto Iter = SomeContainer.begin(), End = SomeContainer.end();
     Iter != End; ++Iter) {}
```
- Use `auto` to make code more readable, but prefer `auto &` or `auto *` to
  avoid unexpected copies.
- `#include` as little as possible to reduce compile times. Use forward
  declarations of classes when possible to avoid including their definitions.
- Do not introduce variables to the code that would require a client to
  dllimport them. Export.hpp does not setup dllimport declarations for
  clients. For example, do not add static function-local variables in inline
  functions in header files.

## Build Performance Tips

Some tips to keep in mind to not needlessly regress build performance when
working with GTIRB:

- Do not include a protobuf header from within a .hpp file unless you need
  the enum values from protobuf. A forward declare + include in the .cpp
  file is sufficient and cuts out 100s of transitive headers to parse.
- CFG.hpp and ByteInterval.hpp are the most expensive headers you can
  possibly include. Avoid including these whenever humanly possible (getting
  rid of 2 includes of CFG.hpp cut out ~2500 transitive header includes).
- Boost headers are extremely heavy to parse, try to push as much of their
  inclusions down into a .cpp file as possible. For instance, including
  boost's endian header requires ~200 transitive headers by itself. Things
  like the boost containers are considerably more expensive. This is what
  contributes to ByteInterval and CFG being so expensive to include.
  Be wary when adding includes to boost headers or adding new boost
  dependencies.
- Do not blindly trust the output from tools like include what you use; they
  sometimes do silly things like include a header file when a forward declare
  is sufficient. When adding an include to a .hpp file, try hard to avoid
  adding the include.

### Testing Development

- All code you care about should be tested.
- Any code you don't care about should be removed.
- C++ code should be tested on Linux using GCC and Clang, and on Windows
  using Visual Studio.
- Code testing is done via Google Test.
- Test names are prefixed with the type of test they are (`Unit_`,
  `System_`, `Integration_`).
- No unit test should take more than 0.5 seconds.

## Building under Windows

Most of the build issues on Windows arise from having to define the location
of many dependencies.

### Troubleshooting

- When using a batch file to call `cmake`, make sure to quote all paths and
  escape all backslashes in paths. i.e.
  `-DCMAKE_PREFIX_PATH="c:\\Program Files\\capstone"` and do not leave a
  trailing backslash on paths.
- Use `-Dprotobuf_DEBUG=ON` for protobuf related build issues in general.
- `'../src/gtirb/proto/protobuf::protoc', needed by
  'src/gtirb/proto/AuxData.pb.h', missing and no known rule to make it` -
  due to missing or unusable protoc protobuf compiler. You may need to
  define `-Dprotobuf_EXECUTABLE="<path to protoc.exe>"`, or check that the
  CMAKE_PREFIX_PATH has a path to the protobuf dir (resulting from
  `ninja install` after building).
- `CMAKE_PREFIX_PATH` is not additive. If you set it again, it will silently
  overwrite prior settings. Add to the one definition, separating with
  semi-colons.

## Python Code Requirements

- Code must be [PEP8](https://www.python.org/dev/peps/pep-0008/) compliant.
  To check for PEP8 compliance, [flake8](https://pypi.org/project/flake8/) is
  recommended, and included as part of our `pre-commit` configuration.
- All code must be formatted with [Black](https://pypi.org/project/black/) (set to line lengths of 79, for PEP8 compliance). A pass through this tool is included as part of our `pre-commit` configuration. - The Python API should be made to run on all versions of Python 3. - Use `UpperCamelCase` for type names, `UPPER_CASE` for constant names, and `snake_case` for other identifier names. ### Testing Development - All code you care about should be tested. - Any code you don't care about should be removed. - Code testing is done via the built-in `unittest` framework. - Code testing uses [`tox`](https://tox.wiki/en/stable/) and [`pytest`](https://docs.pytest.org/en/stable/) to simplify testing supported configurations. - No unit test should take more than 0.5 seconds. ## Documentation The GTIRB documentation consists of complete documentation for all components of the GTIRB API, along with examples and other usage information. ### Building Documentation At minimum, you will need [CMake](https://cmake.org/) and [Doxygen](http://www.doxygen.nl/). To build the documentation: 1. Create and change to a temporary build directory. We will refer to this directory as `build`. ```bash > mkdir build > cd build ``` 2. Build the documentation. ```bash build> cmake [] build> cmake --build . --target doc ``` 3. Open the documentation home page `build/doc/html/index.html` in your browser. The `` are as follows - `-DGTIRB_CXX_API=OFF` : do not generate C++ API documentation. If this option is not specified, `cmake` will attempt to generate C++ API documentation, failing (along with the documentation build as a whole) if [Doxygen](http://www.doxygen.nl/) is not available. - `-DGTIRB_CL_API=OFF` : do not generate Common Lisp API documentation. 
If this option is not specified, `cmake` will attempt to generate Common Lisp API documentation if and only if it can locate a SBCL/Quicklisp installation, failing if [simpler-documentation-template (SDT)](https://github.com/eschulte/simpler-documentation-template) is not available. - `-DGTIRB_PY_API=OFF` : do not generate Python API documentation. If this option is not specified, `cmake` will attempt to generate Python API documentation if and only if it can locate a Python installation, failing if [Sphinx](https://www.sphinx-doc.org/en/master/), [sphinx-autodoc-typehints](https://pypi.org/project/sphinx-autodoc-typehints/), or the Python API dependencies are not available. ### Contributing Markdown Documentation To add a new markdown document to the documentation: 1. Create the new document as a child of `/doc`. - File names start with `gtirb`. - File extension is `.md`. - Use github markdown syntax. - Wrap your markdown documents at 80 columns. 2. Edit `/doc/general/Doxyfile.in` to add the basename of your new markdown document to the `INPUT` rule setting. 3. Edit `/doc/general/CMakeLists.txt` to add your new markdown document to `MDFILES_IN`. Ordering is not important. 4. Integrate your new markdown document into the documentation, either by linking to it from an existing page or by updating `/doc/general/DoxygenLayout.xml` to add an entry to the **More Information** tab. 5. [Build the documentation](#building-documentation) and check that your new page is present and rendered correctly. - If it is not rendered correctly, you may need to add a new preprocessing step to `doc/general/preprocmd.py` to rewrite the corresponding github-style markdown into something Doxygen can handle correctly. ### Graphviz - File names start with `gtirb`. - The color palette is `black`, `lightblue`, `cornflowerblue`, and `coral`. - Render `.dot` files to the same file name with a `.png` extension. * Example: `dot -Tpng gtirbScope.dot > gtirbScope.png` - Use the `arial` font. 
### Python For the Python API, [Sphinx](https://www.sphinx-doc.org/en/master/) and [related plugins](https://pypi.org/project/sphinx-autodoc-typehints/) are required. To install these via [pip](https://pip.pypa.io/en/stable/), run: ```bash pip3 install sphinx sphinx-autodoc-typehints ``` You will also need all the dependencies of the GTIRB Python API itself. If you haven't already installed the Python API (and don't want to do so now) you can install just its dependencies as follows. ```bash cd /build/python python3 setup.py egg_info pip3 install -r gtirb.egg-info/requires.txt ``` ### Common Lisp For the Common Lisp API, [simpler-documentation-template (SDT)](https://github.com/eschulte/simpler-documentation-template) is required. This package should automatically be downloaded via the build process; see `cl/README.md` for details on how to prepare the Common Lisp API. ================================================ FILE: FAQ.md ================================================ Frequently Asked Questions -------------------------- - [I get compiler errors when I try to compile programs using GTIRB. How can I make them go away?](#compiler-errors) - [Linking error with "undefined reference" to gtirb::](#linking-error-with-undefined-reference-to-gtirb) #### Compiler Errors __Q: I get compiler errors when I try to compile programs using GTIRB. How can I make them go away?__ A: GTIRB requires C++17, including the C++17 standard library. If your compiler does not use C++17 by default, you will need to explicitly specify it when compiling programs that use GTIRB. For example: ``` g++ --std=c++17 my_gtirb_program.cpp -lgtirb -o my_gtirb_program ``` #### Linking error with "undefined reference" to gtirb __Q: I get linker errors when I try to compile and link programs using GTIRB. 
How can I make them go away?__ A: This isn't GTIRB specific, but if you place the `-lgtirb` on your compilation line *before* the source file the linker will sometimes throw away the symbols from the GTIRB library which it doesn't think it needs (and if it hasn't read your source yet it won't think it needs much). So if for example, ``` g++ --std=c++17 -lgtirb my_gtirb_program.cpp ``` doesn't work for you, then try this instead. ``` g++ --std=c++17 my_gtirb_program.cpp -lgtirb ``` ================================================ FILE: LICENSE.txt ================================================ ============================================================================== GTIRB is under the MIT License: ============================================================================== MIT License Copyright (c) 2018 GrammaTech, Inc. Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
============================================================================== Software from third parties included in GTIRB: ============================================================================== GTIRB contains third party software which is under different license terms. All such code will be identified clearly using at least one of two mechanisms: 1) It will be in a separate directory tree with its own `LICENSE.txt` or `LICENSE` file at the top containing the specific license and restrictions which apply to that software, or 2) It will contain specific license and restriction terms at the top of every file. ============================================================================== Apache License v2.0 with LLVM Exceptions: ============================================================================== Apache License Version 2.0, January 2004 http://www.apache.org/licenses/ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION 1. Definitions. "License" shall mean the terms and conditions for use, reproduction, and distribution as defined by Sections 1 through 9 of this document. "Licensor" shall mean the copyright owner or entity authorized by the copyright owner that is granting the License. "Legal Entity" shall mean the union of the acting entity and all other entities that control, are controlled by, or are under common control with that entity. For the purposes of this definition, "control" means (i) the power, direct or indirect, to cause the direction or management of such entity, whether by contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the outstanding shares, or (iii) beneficial ownership of such entity. "You" (or "Your") shall mean an individual or Legal Entity exercising permissions granted by this License. "Source" form shall mean the preferred form for making modifications, including but not limited to software source code, documentation source, and configuration files. 
"Object" form shall mean any form resulting from mechanical transformation or translation of a Source form, including but not limited to compiled object code, generated documentation, and conversions to other media types. "Work" shall mean the work of authorship, whether in Source or Object form, made available under the License, as indicated by a copyright notice that is included in or attached to the work (an example is provided in the Appendix below). "Derivative Works" shall mean any work, whether in Source or Object form, that is based on (or derived from) the Work and for which the editorial revisions, annotations, elaborations, or other modifications represent, as a whole, an original work of authorship. For the purposes of this License, Derivative Works shall not include works that remain separable from, or merely link (or bind by name) to the interfaces of, the Work and Derivative Works thereof. "Contribution" shall mean any work of authorship, including the original version of the Work and any modifications or additions to that Work or Derivative Works thereof, that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. For the purposes of this definition, "submitted" means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Work, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as "Not a Contribution." "Contributor" shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work. 2. 
Grant of Copyright License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare Derivative Works of, publicly display, publicly perform, sublicense, and distribute the Work and such Derivative Works in Source or Object form. 3. Grant of Patent License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this section) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Work, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Work to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Work or a Contribution incorporated within the Work constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for that Work shall terminate as of the date such litigation is filed. 4. Redistribution. 
You may reproduce and distribute copies of the Work or Derivative Works thereof in any medium, with or without modifications, and in Source or Object form, provided that You meet the following conditions: (a) You must give any other recipients of the Work or Derivative Works a copy of this License; and (b) You must cause any modified files to carry prominent notices stating that You changed the files; and (c) You must retain, in the Source form of any Derivative Works that You distribute, all copyright, patent, trademark, and attribution notices from the Source form of the Work, excluding those notices that do not pertain to any part of the Derivative Works; and (d) If the Work includes a "NOTICE" text file as part of its distribution, then any Derivative Works that You distribute must include a readable copy of the attribution notices contained within such NOTICE file, excluding those notices that do not pertain to any part of the Derivative Works, in at least one of the following places: within a NOTICE text file distributed as part of the Derivative Works; within the Source form or documentation, if provided along with the Derivative Works; or, within a display generated by the Derivative Works, if and wherever such third-party notices normally appear. The contents of the NOTICE file are for informational purposes only and do not modify the License. You may add Your own attribution notices within Derivative Works that You distribute, alongside or as an addendum to the NOTICE text from the Work, provided that such additional attribution notices cannot be construed as modifying the License. You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions for use, reproduction, or distribution of Your modifications, or for any such Derivative Works as a whole, provided Your use, reproduction, and distribution of the Work otherwise complies with the conditions stated in this License. 5. 
Submission of Contributions. Unless You explicitly state otherwise, any Contribution intentionally submitted for inclusion in the Work by You to the Licensor shall be under the terms and conditions of this License, without any additional terms or conditions. Notwithstanding the above, nothing herein shall supersede or modify the terms of any separate license agreement you may have executed with Licensor regarding such Contributions. 6. Trademarks. This License does not grant permission to use the trade names, trademarks, service marks, or product names of the Licensor, except as required for reasonable and customary use in describing the origin of the Work and reproducing the content of the NOTICE file. 7. Disclaimer of Warranty. Unless required by applicable law or agreed to in writing, Licensor provides the Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Work and assume any risks associated with Your exercise of permissions under this License. 8. Limitation of Liability. 
In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Work (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages. 9. Accepting Warranty or Additional Liability. While redistributing the Work or Derivative Works thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability. END OF TERMS AND CONDITIONS APPENDIX: How to apply the Apache License to your work. To apply the Apache License to your work, attach the following boilerplate notice, with the fields enclosed by brackets "[]" replaced with your own identifying information. (Don't include the brackets!) The text should be enclosed in the appropriate comment syntax for the file format. We also recommend that a file or class name and description of purpose be included on the same "printed page" as the copyright notice for easier identification within third-party archives. 
Copyright [yyyy] [name of copyright owner] Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. ---- LLVM Exceptions to the Apache 2.0 License ---- As an exception, if, as a result of your compiling your source code, portions of this Software are embedded into an Object form of such source code, you may redistribute such embedded portions in such Object form without complying with the conditions of Sections 4(a), 4(b) and 4(d) of the License. In addition, if you combine or link compiled forms of this Software with software that is licensed under the GPLv2 ("Combined Software") and if a court of competent jurisdiction determines that the patent provision (Section 3), the indemnity provision (Section 9) or other Section of the License conflicts with the conditions of the GPLv2, you may retroactively and prospectively choose to deem waived or otherwise exclude such Section(s) of the License, but only in their entirety and only with respect to the Combined Software. ============================================================================== University of Illinois Open Source License: ============================================================================== University of Illinois/NCSA Open Source License Copyright (c) 2003-2019 University of Illinois at Urbana-Champaign. All rights reserved. 
Developed by: LLVM Team University of Illinois at Urbana-Champaign http://llvm.org Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal with the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimers. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimers in the documentation and/or other materials provided with the distribution. * Neither the names of the LLVM Team, University of Illinois at Urbana-Champaign, nor the names of its contributors may be used to endorse or promote products derived from this Software without specific prior written permission. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH THE SOFTWARE. 
================================================
FILE: Macros.cmake
================================================
# Helper macros shared by the GTIRB CMake build.

# Append FLAG to the cached exe and shared-library linker flag strings,
# unless a matching flag is already present.
macro(IMPL_GTIRB_ADD_LINKER_FLAG flag)
  # Quote the expansions: an unquoted ${CMAKE_EXE_LINKER_FLAGS} that is
  # empty (the common initial state) or contains spaces expands to zero or
  # several if() arguments, making the check malformed.
  if(NOT "${CMAKE_EXE_LINKER_FLAGS}" MATCHES "(${flag}.*)")
    set(CMAKE_EXE_LINKER_FLAGS
        "${CMAKE_EXE_LINKER_FLAGS} ${flag}"
        CACHE STRING "Linker Flags" FORCE
    )
  endif()
  if(NOT "${CMAKE_SHARED_LINKER_FLAGS}" MATCHES "(${flag}.*)")
    set(CMAKE_SHARED_LINKER_FLAGS
        "${CMAKE_SHARED_LINKER_FLAGS} ${flag}"
        CACHE STRING "Linker Flags" FORCE
    )
  endif()
endmacro()

# Compiler-conditional wrappers around the helper above.
macro(GTIRB_ADD_MSVC_LINKER_FLAG flag)
  if(MSVC)
    impl_gtirb_add_linker_flag(${flag})
  endif()
endmacro()

macro(GTIRB_ADD_GCC_LINKER_FLAG flag)
  if(CMAKE_COMPILER_IS_GNUCXX)
    impl_gtirb_add_linker_flag(${flag})
  endif()
endmacro()

macro(GTIRB_ADD_CLANG_LINKER_FLAG flag)
  # Quoted for the same reason as above: CMAKE_CXX_COMPILER_ID may be empty
  # on projects that never enabled a CXX language.
  if("${CMAKE_CXX_COMPILER_ID}" STREQUAL "Clang")
    impl_gtirb_add_linker_flag(${flag})
  endif()
endmacro()

# Target-declaration helpers; they read sources from the conventional
# ${PROJECT_NAME}_H / ${PROJECT_NAME}_SRC / ${PROJECT_NAME}_PROTO variables.
macro(GTIRB_ADD_LIBRARY)
  add_library(
    ${PROJECT_NAME} ${${PROJECT_NAME}_H} ${${PROJECT_NAME}_SRC}
    ${${PROJECT_NAME}_PROTO}
  )
  set_target_properties(${PROJECT_NAME} PROPERTIES FOLDER "gtirb")
endmacro()

macro(GTIRB_ADD_LIBRARY_STATIC)
  add_library(
    ${PROJECT_NAME} STATIC ${${PROJECT_NAME}_H} ${${PROJECT_NAME}_SRC}
  )
  set_target_properties(${PROJECT_NAME} PROPERTIES FOLDER "gtirb")
endmacro()

macro(GTIRB_ADD_LIBRARY_HEADERONLY)
  add_library(${PROJECT_NAME} INTERFACE)
  target_include_directories(
    ${PROJECT_NAME} INTERFACE ${CMAKE_CURRENT_SOURCE_DIR}
  )
endmacro()

macro(GTIRB_ADD_EXECUTABLE)
  add_executable(${PROJECT_NAME} ${${PROJECT_NAME}_H} ${${PROJECT_NAME}_SRC})
  set_target_properties(${PROJECT_NAME} PROPERTIES FOLDER "gtirb/applications")
endmacro()

macro(GTIRB_ADD_EXECUTABLE_GTEST)
  add_executable(${PROJECT_NAME} ${${PROJECT_NAME}_H} ${${PROJECT_NAME}_SRC})
  add_test(NAME ${PROJECT_NAME} COMMAND ${PROJECT_NAME})
  set_target_properties(${PROJECT_NAME} PROPERTIES FOLDER "gtirb/test")
endmacro()

# Collect the immediate subdirectories of curdir into ${result}.
macro(GTIRB_GET_ALL_SUBDIRS result curdir)
  file(
    GLOB children
    RELATIVE ${curdir}
    ${curdir}/*
  )
  set(dirlist "")
  foreach(child ${children})
    if(IS_DIRECTORY ${curdir}/${child})
      list(APPEND dirlist ${child})
    endif()
  endforeach()
  set(${result} ${dirlist})
endmacro()

macro(GTIRB_ADD_ALL_SUBDIRS)
  gtirb_get_all_subdirs(SUBDIRS ${CMAKE_CURRENT_SOURCE_DIR})
  foreach(subdir ${SUBDIRS})
    add_subdirectory(${subdir})
  endforeach()
endmacro()

# Provide a vaguely consistent interface to find a Python 3 interpreter. Just
# use FindPython3 if it exists, but fall back to looking for the interpreter
# program if we have to.
if(${CMAKE_VERSION} VERSION_GREATER_EQUAL "3.12")
  macro(GTIRB_FIND_PYTHON)
    find_package(Python3 REQUIRED COMPONENTS Interpreter)
    if(Python3_EXECUTABLE)
      set(PYTHON ${Python3_EXECUTABLE})
    endif()
  endmacro()
else()
  macro(GTIRB_FIND_PYTHON)
    find_program(PYTHON NAMES python3 python py)
    if(PYTHON)
      # Reject a Python 2 interpreter: parse `python --version` output and
      # unset PYTHON when the version is below 3.
      execute_process(
        COMMAND "${PYTHON}" --version OUTPUT_VARIABLE Python3_VERSION
      )
      string(REPLACE "Python " "" Python3_VERSION "${Python3_VERSION}")
      if("${Python3_VERSION}" VERSION_LESS 3)
        unset(PYTHON)
        unset(Python3_VERSION)
      endif()
    endif()
  endmacro()
endif()

================================================
FILE: PROTOBUF.md
================================================
Using Serialized GTIRB Data
===========================

> Note that for languages with GTIRB APIs (at least C++, Python, Common
> Lisp) using the GTIRB API is preferable to manipulating protobuf
> directly.

GTIRB uses a serialized format that consists of an 8-byte signature
followed by serialized [protobuf](https://github.com/google/protobuf/wiki)
data. The protobuf data allows for exploration and manipulation in the
language of your choice. The
[Google protocol buffers](https://developers.google.com/protocol-buffers/)
homepage lists the languages in which protocol buffers can be used directly;
users of other languages can convert the protobuf-formatted data to JSON
format and then use the JSON data in their applications. In the future we
intend to define a standard JSON schema for GTIRB.
The 8-byte signature that prefixes the protobuf data includes both GTIRB's
magic number and the version for GTIRB's protobuf specification that is in
use. The layout is as follows:

- Bytes 0-4 contain the ASCII characters: `GTIRB`.
- Bytes 5-6 are considered reserved for future use and should be 0.
- Byte 7 contains the GTIRB protobuf spec version in use.

Directory `gtirb/src/proto` contains the protocol buffer message type
definitions for GTIRB. You can inspect these `.proto` files to determine the
structure of the various GTIRB message types. The top-level message type is
`IR`.

- [General Guidelines](#general-guidelines)
- [Python Applications](#python-applications)
- [Java Applications](#java-applications)

# General Guidelines

If you have not used protocol buffers before, there are several useful
resources available at https://developers.google.com/protocol-buffers/,
including an installation guide and a tutorial.

In general, writing an application to use GTIRB data in protocol buffer
format will involve the following steps.

1. Install the protocol buffer compiler (`protoc`) from
   https://github.com/protocolbuffers/protobuf/releases, if you haven't
   already done so.

2. Install any required protocol buffer library or libraries for the
   programming language you are using.

3. Invoke the protocol buffer compiler on the `.proto` files in
   `gtirb/src/proto/` to generate code in the language you wish to use.

4. Write your application, importing/including the file or files you
   generated in step 3.

The [Protocol Buffers API Reference](https://developers.google.com/protocol-buffers/docs/reference/overview)
provides language-specific instructions for the various supported
programming languages, along with links to information for cases where
support is provided by third-party plug-ins.

# Python Applications

To create a Python application that uses serialized GTIRB data, do the
following.

1. Install the protocol buffer compiler (`protoc`).

2.
Install the Python protobuf library, if you haven't already done so.

       $ pip install protobuf

3. Generate Python message definitions in a dedicated directory (for
   example, `python/`).

       $ mkdir -p python
       $ for f in src/proto/*.proto; do
           protoc -Isrc/proto --python_out=python $f; done

   This will create a number of files with names of the form
   `<name>_pb2.py` in the `python/` subdirectory of your working directory:
   one for each `.proto` in src/proto/, including `IR_pb2.py`.

4. Write your application. Make sure that it imports `IR_pb2`, or the parts
   of it that you require.

5. Run your application, making sure that the directory containing your
   message definitions is in the `PYTHONPATH`.

## Python Examples

Directory `gtirb/doc/examples` contains several example Python scripts that
use protocol buffers to explore serialized GTIRB data.

- [cfg-paths.py](doc/examples/cfg-paths.py)
- [data-symbols.py](doc/examples/data-symbols.py)

# Java Applications

To create a Java application that uses serialized GTIRB data, do the
following.

1. Install the protocol buffer compiler (`protoc`).

2. Download the `protobuf` Java runtime from
   [https://mvnrepository.com/artifact/com.google.protobuf/protobuf-java](https://mvnrepository.com/artifact/com.google.protobuf/protobuf-java)
   and save it somewhere suitable.

3. Generate Java message definitions in a dedicated directory (for example,
   `java/`).

       $ mkdir -p java
       $ for f in src/proto/*.proto; do
           protoc -Isrc/proto --java_out=java $f; done

   This will create a subdirectory `java/proto/`, containing a number of
   files with names of the form `OuterClass.java`: one for each `.proto` in
   `src/proto/`.

4. Compile the Java message definitions, making sure the `protobuf` Java
   runtime `.jar` file is in your `CLASSPATH`.

       $ mkdir -p java/classfiles
       $ CLASSPATH=<path-to-protobuf-jar> \
           javac -d java/classfiles java/proto/*.java

   (If you want to build a `.jar` file to combine all these `.class` files,
   do so at this stage.)

5. Write your application.
Make sure that it imports all the classes you need from the `proto` package.

6. Compile and run your application, making sure that your CLASSPATH
   contains both the `protobuf` Java runtime `.jar` file and the location of
   your compiled message definition classes.

## Java Examples

Directory `gtirb/doc/examples` contains several example Java programs that
use protocol buffers to explore serialized GTIRB data.

- [datasymbols.java](doc/examples/datasymbols.java)

================================================
FILE: README.md
================================================
# GTIRB

The GrammaTech Intermediate Representation for Binaries (GTIRB) is a machine
code analysis and rewriting data structure. It is intended to facilitate the
communication of binary IR between programs performing binary disassembly,
analysis, transformation, and pretty printing. GTIRB is modeled on LLVM-IR,
and seeks to serve a similar functionality of encouraging communication and
interoperability between tools.

The remainder of this file describes various aspects of GTIRB:

- [Structure](#structure)
- [Installing](#installing)
- [Building](#building)
- [Usage](#usage)

# Structure

GTIRB has the following structure. Solid lines denote inheritance. Dotted
lines denote reference by UUID.

![GTIRB Data Structure](.gtirb.svg)

## IR

An instance of GTIRB may include multiple modules (`Module`) which represent
loadable objects such as executables or libraries, an inter-procedural
control flow graph (`IPCFG`), and Auxiliary Data tables (`AuxData`) which
can hold arbitrary analysis results in user-defined formats which can easily
reference other elements of the IR. Each module holds information such as
symbols (`Symbol`) and sections which themselves hold the actual bytes and
data and code blocks of the module. The CFG consists of basic blocks
(`Block`) and control flow edges between these blocks. Each data or code
block references a range of bytes in a byte interval (`ByteInterval`).
A section may hold one large byte interval holding all blocks---if the
relative positions of blocks in that section are defined---or may hold one
byte interval per block---if the relative positions of blocks are not
defined, e.g. for the code blocks in the `.text` section during program
rewriting. Each symbol holds a pointer to the block or datum it references.

## Instructions

GTIRB explicitly does NOT represent instructions or instruction semantics
but does provide symbolic operand information and access to the bytes. There
are many *intermediate languages* (IL)s for representation of instruction
semantics (e.g., [BAP][]'s [BIL][], [Angr][]'s [Vex][], or [Ghidra][]'s
P-code). GTIRB works with these or any other IL by storing instructions
generally and efficiently as *raw machine-code bytes* and separately storing
the symbolic and control flow information. The popular
[Capstone][]/[Keystone][] decoder/encoder provide an excellent option to
read and write instructions from/to GTIRB's machine-code byte representation
without committing to any particular semantic IL. By supporting multiple ILs
and separate storage of analysis results in auxiliary data tables GTIRB
enables collaboration between independent binary analysis and rewriting
teams and tools.

[BAP]: https://github.com/BinaryAnalysisPlatform/bap
[BIL]: https://github.com/BinaryAnalysisPlatform/bil/releases/download/v0.1/bil.pdf
[Angr]: http://angr.io
[Vex]: https://github.com/angr/pyvex
[Ghidra]: https://www.nsa.gov/resources/everyone/ghidra/
[Capstone]: https://www.capstone-engine.org
[Keystone]: https://www.keystone-engine.org

## Auxiliary Data

GTIRB provides for the sharing of additional information, e.g. analysis
results, in the form of `AuxData` objects. These can store maps and vectors
of basic GTIRB types in a portable way.
The [GTIRB manual][] describes the structure for common types of auxiliary data such as function boundary information, type information, or results of common analyses in [Standard AuxData Schemata][]. [GTIRB manual]: https://grammatech.github.io/gtirb/ [Standard AuxData Schemata]: https://grammatech.github.io/gtirb/md__aux_data.html ## UUIDs Every element of GTIRB---e.g., modules (`Module`), symbols (`Symbol`), and blocks (`Block`)---has a universally unique identifier (UUID). UUIDs allow both first-class IR components and AuxData tables to reference elements of the IR. Instructions and symbolic operands can be addressed by the class `Offset` which encapsulates a UUID (that refers to the instruction's block) and an offset. # Installing Packages currently exist for easily installing GTIRB (and attendant tooling including the [ddisasm][] disassembler and [gtirb-pprinter][] pretty printer) on Windows, and Ubuntu 20. See below for instructions. Additionally, a public Docker image exists at [grammatech/ddisasm][] with all of these tools installed. GTIRB is versioned with Major.Minor.Patch versioning where Major version increments will require significant source changes but should be very rare, Minor version increments may require small source changes, and Patch version increments shouldn't break any downstream builds. We do not yet provide ABI compatibility across any version changes. 
[ddisasm]: https://github.com/GrammaTech/ddisasm [gtirb-pprinter]: https://github.com/GrammaTech/gtirb-pprinter [grammatech/ddisasm]: https://hub.docker.com/r/grammatech/ddisasm ## Python API The latest stable GTIRB Python API may be installed from PyPI using pip: ```sh pip install gtirb ``` The latest unstable version of the Python API can be installed from a prebuilt wheel: ```sh pip install https://download.grammatech.com/gtirb/files/python/gtirb-0.dev-py3-none-any.whl ``` It is critical that the choice of a `stable` or `unstable` package matches the installed ddisasm and gtirb-pprinter packages. ## Windows Windows releases are packaged as .zip files and are available at https://download.grammatech.com/gtirb/files/windows-release/. ## Ubuntu Packages for Ubuntu 20 are available in the GTIRB apt repository and may be installed per the following instructions. First, add GrammaTech's APT key. ```sh wget -O - https://download.grammatech.com/gtirb/files/apt-repo/conf/apt.gpg.key | apt-key add - ``` Next update your sources.list file. ```sh echo "deb [arch=amd64] https://download.grammatech.com/gtirb/files/apt-repo [distribution] [component]"| sudo tee -a /etc/apt/sources.list ``` Where: - `[distribution]` is `focal` (currently, only Ubuntu 20 packages are available) - `[component]` is either `stable`, which holds the last versioned release, or `unstable`, which holds the HEAD of the repository. Finally update your package database and install the core GTIRB tools: ```sh sudo apt-get update sudo apt-get install gtirb-pprinter ddisasm ``` **Warning**: Stable versions gtirb-2.0.0, gtirb-pprinter-2.1.0, ddisasm-1.8.0 and OLDER rely on metapackages which cause conflicts if you try `apt-get upgrade` (see https://github.com/GrammaTech/gtirb/issues/63). In this case, uninstall and reinstall the packages you got from the GTIRB repository. You may need to use `dpkg --remove` to remove the metapackages (e.g. `ddisasm`) before removing the concrete versioned packages (e.g. 
`ddisasm-1.5.1`). NEWER stable versions no longer rely on metapackages and
can be upgraded without problems.

# Building

GTIRB's C++ API should successfully build in 64-bits with GCC, Clang, and
Visual Studio compilers supporting at least C++17. GTIRB uses CMake which
must be installed with at least version 3.10.

The common build process looks like this:

```sh
mkdir build
cd build
# Note: You may wish to add some -D arguments to the next command. See below.
cmake ..
cmake --build .
# Run the test suite.
ctest
```

For customizing the GTIRB build, you can get a list of customization options
by navigating to your build directory and running:

```sh
cmake -LH
```

## Requirements

To build and install GTIRB, the following requirements should be installed:

- [CMake][], version 3.10.0 or higher.
  - Ubuntu 18 provides this version via the APT package `cmake`.
  - Ubuntu 16 and earlier provide out of date versions; build from source on
    those versions.
- [Protobuf][], version 3.0.0 or later.
  - Ubuntu 18 provides this version via the APT packages `libprotobuf-dev`
    and `protobuf-compiler`.
  - Ubuntu 16 and earlier provide out of date versions; build from source on
    those versions.
- Boost [(non-standard Ubuntu package from launchpad.net)][], version 1.68
  or later.
  - Ubuntu 18 only has version 1.65 in the standard repository. See Ubuntu
    instructions above.

[CMake]: https://cmake.org/
[Protobuf]: https://developers.google.com/protocol-buffers/
[(non-standard Ubuntu package from launchpad.net)]: https://launchpad.net/~mhier/+archive/ubuntu/libboost-latest

# Usage

GTIRB is designed to be serialized using [Google protocol buffers][] (i.e.,
[protobuf][]), enabling
[easy and efficient use from any programming language](#using-serialized-gtirb-data).

GTIRB may also be used through a dedicated API implemented in multiple
languages. The APIs provide efficient data structures suitable for use by
binary analysis and rewriting applications; see
[below](#gtirb-api-implementations) for details.
[Google protocol buffers]: https://developers.google.com/protocol-buffers/ [protobuf]: https://github.com/google/protobuf/wiki ## Using Serialized GTIRB Data GTIRB uses a serialized format that consists of an 8-byte signature followed by serialized [protobuf][] data. The protobuf data allows for exploration and manipulation in the language of your choice. The [Google protocol buffers][] homepage lists the languages in which protocol buffers can be used directly; users of other languages can convert the protobuf-formatted data to JSON format and then use the JSON data in their applications. The `proto` directory in this repository contains the protocol buffer message type definitions for GTIRB. You can inspect these `.proto` files to determine the structure of the various GTIRB message types. The top-level message type is `IR`. For more details, see [Using Serialized GTIRB Data](PROTOBUF.md). ## GTIRB API Implementations The GTIRB API is currently available in C++, Python, and Common Lisp. There is a *partial* Java API which is not ready for external use. For language-independent API information, see [GTIRB Components](doc/general/ComponentsIndex.md). 
For information about the different API implementations, see:

- [C++ API](doc/cpp/README.md)
- [Python API](python/README.md)
- [Common Lisp API](cl/README.md)
- Java API **incomplete**

================================================
FILE: cl/CMakeLists.txt
================================================
# Build standalone Common Lisp executables (gtirb-dot, gtirb-update) from
# the sources in this directory, and register the CL test suite.

# All lisp sources and system definitions; any change triggers a rebuild of
# every executable below.
file(GLOB CL_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/*.lisp
     ${CMAKE_CURRENT_SOURCE_DIR}/*.asd
)
# One executable per stem: gtirb-dot and gtirb-update.
set(CL_EXECUTABLE_STEMS dot update)
foreach(CL_EXECUTABLE_STEM ${CL_EXECUTABLE_STEMS})
  set(CL_EXECUTABLE ${CMAKE_CURRENT_BINARY_DIR}/gtirb-${CL_EXECUTABLE_STEM})
  list(APPEND CL_EXECUTABLES ${CL_EXECUTABLE})
  # Drive ${LISP} (presumably SBCL — the flags are SBCL-style; confirm at
  # configure time) through Quicklisp/ASDF to dump a monolithic program
  # image, then move it into the binary dir.
  add_custom_command(
    OUTPUT ${CL_EXECUTABLE}
    DEPENDS ${CL_SOURCES} ${PROTO_FILES}
    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}
    COMMAND ${LISP} --noinform --dynamic-space-size 16384 --no-userinit
            --no-sysinit --disable-debugger --load ${QUICKLISP}/setup.lisp
            --eval
            "(asdf:initialize-source-registry `(:source-registry (:tree \"${CMAKE_CURRENT_SOURCE_DIR}\") :inherit-configuration))"
            --eval "(ql:quickload :gtirb/${CL_EXECUTABLE_STEM})" --eval
            "(setf uiop/image::*lisp-interaction* nil)" --eval
            "(asdf:make :gtirb/run-${CL_EXECUTABLE_STEM} :type :program :monolithic t)"
            --eval "(uiop/image:quit)"
    # asdf:make writes the image next to the sources; copy it to the build
    # tree and remove the original so the source dir stays clean.
    COMMAND ${CMAKE_COMMAND} -E copy gtirb-${CL_EXECUTABLE_STEM}
            ${CMAKE_CURRENT_BINARY_DIR}
    COMMAND ${CMAKE_COMMAND} -E remove gtirb-${CL_EXECUTABLE_STEM}
    VERBATIM
  )
endforeach(CL_EXECUTABLE_STEM)
# Umbrella target so `make clgtirb` (and ALL) builds every CL executable.
add_custom_target(clgtirb ALL DEPENDS ${CL_EXECUTABLES})
if(GTIRB_ENABLE_TESTS)
  # Run the CL test suite in-process via the same Quicklisp bootstrap.
  add_test(
    NAME testgtirbcl
    COMMAND
      ${LISP} --noinform --dynamic-space-size 16384 --no-userinit
      --no-sysinit --disable-debugger --load "${QUICKLISP}/setup.lisp" --eval
      "(asdf:initialize-source-registry `(:source-registry (:tree \"${CMAKE_CURRENT_SOURCE_DIR}\") :inherit-configuration))"
      --eval "(ql:quickload :gtirb/test)" --eval "(gtirb/test:batch-test)"
    WORKING_DIRECTORY "${CMAKE_CURRENT_SOURCE_DIR}/"
  )
endif()

================================================
FILE: cl/README.md
================================================
Common Lisp library for GTIRB
=============================

The Common Lisp API for GrammaTech's IR for Binaries (GTIRB). GTIRB is a
data structure designed to support the analysis and rewriting of binary
executables. There are a number of tools that produce, process and consume
GTIRB. See the following for more information on GTIRB:

- [https://github.com/grammatech/gtirb](https://github.com/grammatech/gtirb)
  the main GTIRB source repository.
- [https://grammatech.github.io/gtirb/](https://grammatech.github.io/gtirb/)
  the GTIRB manual repository.
- [https://arxiv.org/abs/1907.02859](https://arxiv.org/abs/1907.02859)
  a white-paper describing the design goals of GTIRB.
- [https://github.com/grammatech/ddisasm](https://github.com/grammatech/ddisasm)
  a very high performance reassembleable disassembler producing GTIRB.
- [https://github.com/grammatech/gtirb-pprinter](https://github.com/grammatech/gtirb-pprinter)
  a pretty printer from GTIRB to assembler.

## Requirements and Installation

Hopefully, eventually, it will be possible to install everything by
(1) installing [Protobuf](https://developers.google.com/protocol-buffers/),
version 3.7.0 or later, and then (2) installing this Common Lisp GTIRB
library with QuickLisp `(ql:quickload :gtirb)`. We're a ways away from that
currently. So after you've installed Protobuf, you should clone and install
the Common Lisp `PROTOBUF` package manually according to the instructions at
[https://github.com/brown/protobuf](https://github.com/brown/protobuf)
ensuring that the `protoc-gen-lisp` executable has been built and is on your
path. At that point you should be able to load the GTIRB package.

## Usage

The Common Lisp API attempts to provide access to the underlying GTIRB
data-structure described above in idiomatic common lisp. The main Protobuf
data structures are wrapped in CLOS objects. All fields are modifiable with
`setf`. Invariants are maintained automatically by the API, e.g.
using `:around` methods. In some cases accessors are provided beyond the fields directly present in the Protobuf. For example, every GTIRB element has a UUID (which supports referencing elements from AuxData tables). The Common Lisp API provides uniform access to any element through the `get-uuid` method which operates similarly to `gethash` only it may be called on any top-level GTIRB `IR` object (which itself maintains a hash of every contained element by UUID). The GTIRB CFG is represented as a graph using the Common Lisp graph library from [https://github.com/eschulte/graph](https://github.com/eschulte/graph). This simple representation should promote easy exploration and modification of the control flow graph, and the many graph analysis functions defined in that library may be directly applied to the CFG. Every node of the graph holds the UUID for a code block. The bytes of any code and data block may be accessed by calling the `bytes` method, which provides direct access to the bytes of the block's `byte-interval`. ### Example Usage See the test suite for a large number of basic usage examples. However, the following gives a simple usage example. 1. From the command-line. Use the datalog disassembler `ddisasm` to disassemble the `ls` executable into a GTIRB instance. ddisasm --ir $(which ls) /tmp/ls.gtirb 2. From the Common Lisp REPL. Load the GTIRB API, and then load the GTIRB instance created in step (1) into a common lisp GTIRB object. (ql:quickload :gtirb) (use-package :gtirb) (defparameter ls (read-gtirb "/tmp/ls.gtirb")) 3. At this point you can explore the CFG, perform analyses, or even modify the contents of the GTIRB object. Results of analyses may be saved into new AuxData tables which become part of the GTIRB object for later use by other sessions or by other tools potentially written in other languages. ;; Do stuff with the GTIRB, maybe make changes. 4. Finally, the resulting GTIRB object may be written back to the file system.
(write-gtirb ls "/tmp/ls-modified.gtirb")

5. At the command line. A new executable may be created from the modified gtirb file using the `gtirb-pprinter`.

gtirb-pprinter --ir /tmp/ls-modified.gtirb --binary /tmp/ls-modified

================================================ FILE: cl/dot.lisp ================================================
(defpackage :gtirb/dot
  (:use :common-lisp :alexandria :graph :graph/dot :gtirb
        :command-line-arguments :named-readtables
        :curry-compose-reader-macros)
  (:import-from :uiop :nest)
  (:import-from :uiop/image :quit)
  (:shadowing-import-from :proto-v0 :ir)
  (:shadowing-import-from :gtirb :symbol)
  (:export :to-dot :to-dot-file))
(in-package :gtirb/dot)
(in-readtable :curry-compose-reader-macros)

(defun dot-edge-label (graph edge)
  "Return a quoted DOT label string for EDGE of GRAPH.
The label shows the edge type plus [C|U] for conditional/unconditional
and [D|I] for direct/indirect, e.g. \"BRANCH[C:D]\"."
  (let ((obj (edge-value graph edge)))
    (format nil "\"~a[~:[U~;C~]:~:[I~;D~]]\""
            (edge-type obj) (conditional obj) (direct obj))))

(defmethod to-dot ((obj gtirb) &rest rest)
  "Write the CFG of OBJ to the Graphviz graphing language."
  (apply #'to-dot (cfg obj)
         :edge-attrs (list (cons :label {dot-edge-label (cfg obj)}))
         rest))

(eval-when (:compile-toplevel :load-toplevel :execute)
  ;; Command-line specification consumed by `define-command' below.
  ;; Renamed from the original misspelled `+udpate-args+' (defined and
  ;; used only in this file and not exported, so the rename is local).
  (defparameter +update-args+
    '((("help" #\h #\?) :type boolean :optional t
       :documentation "display help output"))))

;;; NOTE: When Quicklisp updates graph to the latest this can be removed.
(defmethod to-dot-file ((object t) path &key attributes node-attrs
                                          edge-attrs subgraphs ranks)
  (with-open-file (out path :direction :output :if-exists :supersede)
    (to-dot object :stream out :attributes attributes :node-attrs node-attrs
            :edge-attrs edge-attrs :subgraphs subgraphs :ranks ranks)))

(define-command dot (gtirb-file dot-file &spec +update-args+)
  "Write first GTIRB module in GTIRB-FILE to DOT-FILE."
"" (when help (show-help-for-dot) (quit)) (to-dot-file (read-gtirb gtirb-file) dot-file)) ================================================ FILE: cl/gtirb.asd ================================================ (defsystem "gtirb" :name "gtirb" :author "GrammaTech" :licence "MIT" :description "Common Lisp library for GTIRB" :long-description "A Common Lisp front end to the GrammaTech Intermediate Representation for Bianries (GTIRB). GTIRB is serialized using Google's protocol buffers. This library wraps the raw protocol buffer serialization with a more Lispy interface." :depends-on (:gtirb/gtirb) :class :package-inferred-system :defsystem-depends-on (:asdf-package-system :protobuf) :in-order-to ((test-op (load-op "gtirb/test"))) :perform (test-op (o c) (symbol-call :gtirb/test '#:test))) (defsystem "proto-v0" :name "proto-v0" :description "Common Lisp interface to (old V0) GTIRB protobuf files" :author "GrammaTech" :license "MIT" :defsystem-depends-on (:protobuf) :components ((:static-file "README.md") ;; See the protobuf defsystem extension for how the gtirb.proto ;; file is loaded into Lisp. https://github.com/brown/protobuf (:module proto :pathname "../proto/v0/" :components ((:protobuf-source-file "AuxDataContainer") (:protobuf-source-file "CFG") (:protobuf-source-file "Section") (:protobuf-source-file "Offset") (:protobuf-source-file "IR") (:protobuf-source-file "ByteMap") (:protobuf-source-file "ProxyBlock") (:protobuf-source-file "AuxData") (:protobuf-source-file "Module") (:protobuf-source-file "DataObject") (:protobuf-source-file "ImageByteMap") (:protobuf-source-file "SymbolicExpression") (:protobuf-source-file "Symbol") (:protobuf-source-file "Block"))))) (defsystem "proto" :name "proto" :description "Common Lisp interface to GTIRB protobuf files" :author "GrammaTech" :license "MIT" :defsystem-depends-on (:protobuf) :components ((:static-file "README.md") ;; See the protobuf defsystem extension for how the gtirb.proto ;; file is loaded into Lisp. 
https://github.com/brown/protobuf (:module proto :pathname "../proto" :components ((:protobuf-source-file "AuxData") (:protobuf-source-file "ByteInterval") (:protobuf-source-file "CFG") (:protobuf-source-file "CodeBlock") (:protobuf-source-file "Offset") (:protobuf-source-file "DataBlock") (:protobuf-source-file "IR") (:protobuf-source-file "Module") (:protobuf-source-file "ProxyBlock") (:protobuf-source-file "Section") (:protobuf-source-file "Symbol") (:protobuf-source-file "SymbolicExpression"))))) (defsystem "gtirb/run-validate" :author "GrammaTech" :licence "MIT" :description "Validate a GTIRB instance." :depends-on (gtirb/validate) :build-operation "asdf:program-op" :build-pathname "gtirb-validate" :entry-point "gtirb/validate::run-validate-file") (defsystem "gtirb/run-update" :author "GrammaTech" :licence "MIT" :description "Convert between GTIRB protobuf versions." :depends-on (gtirb/update) :build-operation "asdf:program-op" :build-pathname "gtirb-update" :entry-point "gtirb/update::run-update") (defsystem "gtirb/run-dot" :author "GrammaTech" :licence "MIT" :description "Write GTIRB to a dot graph." 
:depends-on (gtirb/dot) :build-operation "asdf:program-op" :build-pathname "gtirb-dot" :entry-point "gtirb/dot::run-dot") (register-system-packages "proto" '(:gtirb.proto)) (register-system-packages "cl-interval" '(:interval)) ================================================ FILE: cl/gtirb.lisp ================================================ (defpackage :gtirb/gtirb (:nicknames :gtirb) (:use :common-lisp :alexandria :cl-ppcre :graph :trivia :trivial-utf-8 :ieee-floats :gtirb/ranged :gtirb/utility :gtirb/version :named-readtables :curry-compose-reader-macros) (:shadow :symbol) (:import-from :gtirb.proto) (:import-from :trivial-package-local-nicknames :add-package-local-nickname) (:import-from :uiop :nest) (:import-from :cl-intbytes :int->octets :octets->int :octets->uint) (:export :read-gtirb :write-gtirb :is-equal-p :*is-equal-p-verbose-p* :gtirb-node :get-uuid :remove-uuid :at-address :on-address :address-range :uuid :update-proto ;;; Classes and fields. :gtirb :ir :cfg :version ;; Module :module :name :binary-path :isa :file-format :byte-order :preferred-addr :rebase-delta :symbols :proxies :sections :aux-data :entry-point ;; Symbol :symbol :value :payload :at-end ;; Section :section :byte-intervals :flags ;; Byte-Interval :byte-interval :blocks :addressp :address :contents :size :truncate-contents :ignore ;; Symbolic expressions :symbolic-expressions :sym-addr-const :sym-addr-addr :scale :*preserve-symbolic-expressions* ;; Block :gtirb-block :gtirb-byte-block :code-block :data-block :decode-mode :bytes :offset ;; Edge-Label :edge-label :conditional :direct :edge-type ;; Aux-Data :aux-data-type :aux-data-data ;; gtirb :modules)) (in-package :gtirb/gtirb) (in-readtable :curry-compose-reader-macros) (eval-when (:compile-toplevel :load-toplevel :execute) (add-package-local-nickname :proto :gtirb.proto)) (defgeneric read-gtirb (source) (:documentation "Read a protobuf serialized GTIRB instance from SOURCE.") (:method ((path t)) (make-instance 'gtirb :proto 
(read-proto 'proto:ir path)))) (defmethod read-gtirb :around (source) "Check the protobuf version." (let ((gtirb (call-next-method))) (unless (= protobuf-version (proto:version (proto gtirb))) (warn "Protobuf version mismatch version ~a from ~a isn't expected ~a" (proto:version (proto gtirb)) source protobuf-version)) gtirb)) (defun write-gtirb (gtirb path) "Write a GTIRB IR object to PATH." (update-proto gtirb) (write-proto (proto gtirb) path)) ;;;; Class utilities. (defvar *is-equal-p-verbose-p* nil "Compare equality verbosely in the `is-equal-p' function. This may be useful to print contextual information when an equality comparison fails for a large object with many nested objects.") (defvar *is-equal-p-verbose-output-buffer* nil "Buffer to hold output of is-equal-p verbose failure messages.") (defvar *is-equal-p-verbose-output-length* 10 "Maximum length of output to show of `*is-equal-p-verbose-output-buffer*'.") (defmacro compare-or-verbose (comparison left right &rest flags) `(or (,comparison ,left ,right ,@flags) (prog1 nil (when *is-equal-p-verbose-p* (push (format nil "NOT ~S" (list ',comparison ,left ,right)) *is-equal-p-verbose-output-buffer*))))) (defun is-equal-p (left right) "Return t if LEFT and RIGHT are equal. Recursively descend into any sub-structure. Custom recursive equality predicates are defined for common Common Lisp data structures as well as all GTIRB structures." 
(let ((*is-equal-p-verbose-output-buffer* nil)) (let ((equalp (is-equal-p-internal left right))) (prog1 equalp (when (and (not equalp) *is-equal-p-verbose-p*) (format t "~{~S~%~}" (subseq *is-equal-p-verbose-output-buffer* 0 *is-equal-p-verbose-output-length*))))))) (defmethod is-equal-p-internal :around ((left t) (right t)) (let ((equalp (call-next-method))) (when equalp (setf *is-equal-p-verbose-output-buffer* nil)) equalp)) (defgeneric is-equal-p-internal (left right) (:documentation "Internal function called by `is-equal-p'.") (:method ((left t) (right t)) (compare-or-verbose equalp left right)) (:method ((left number) (right number)) (compare-or-verbose = left right)) (:method ((left cl:symbol) (right cl:symbol)) (compare-or-verbose eql left right)) (:method ((left string) (right string)) (compare-or-verbose string= left right)) (:method ((left cons) (right cons)) (if (and (proper-list-p left) (proper-list-p right)) (compare-or-verbose set-equal left right :test #'is-equal-p-internal) (and (compare-or-verbose is-equal-p-internal (car left) (car right)) (compare-or-verbose is-equal-p-internal (cdr left) (cdr right))))) (:method ((left hash-table) (right hash-table)) (compare-or-verbose set-equal (hash-table-alist left) (hash-table-alist right) :test #'is-equal-p-internal)) (:method ((left graph:digraph) (right graph:digraph)) (and (compare-or-verbose set-equal (graph:nodes left) (graph:nodes right) :test #'is-equal-p-internal) (compare-or-verbose set-equal (graph:edges-w-values left) (graph:edges-w-values right) :test #'is-equal-p-internal)))) (defclass gtirb-node () () (:documentation "Objects with a UUID contained in a GTIRB instance.")) (defclass proto-backed (gtirb-node) () (:documentation "Objects which may be serialized to/from protobuf.")) (defgeneric uuid (object) (:documentation "Return the UUID for OBJECT as an integer.") (:method ((obj proto-backed)) (uuid-to-integer (proto:uuid (proto obj))))) (defgeneric get-uuid (uuid object) (:documentation "Get 
the referent of UUID in OBJECT.")) (defgeneric remove-uuid (uuid object) (:documentation "Remove the entry for UUID from OBJECT.")) (defgeneric (setf get-uuid) (new uuid object) (:documentation "Register REFERENT behind UUID in OBJECT.")) (defgeneric insert-address (object item start-address &optional end-address) (:documentation "Insert ITEM into OBJECT between START-ADDRESS and END-ADDRESS.")) (defgeneric delete-address (object item start-address &optional end-address) (:documentation "Delete ITEM from OBJECT between START-ADDRESS and END-ADDRESS.")) (defgeneric at-address (object address) (:documentation "Find all objects in OBJECT starting at ADDRESS.")) (defgeneric on-address (object start-address &optional end-address) (:documentation "Find all objects in OBJECT between START-ADDRESS and END-ADDRESS.")) (defgeneric set-parent-uuid (new uuid object) (:documentation "Set UUID to NEW in OBJECT's parent.")) (defgeneric update-proto (proto-backed-object) (:documentation "Update and return the `proto' field of PROTO-BACKED-OBJECT. This will ensure that any changes made to PROTO-BACKED-OBJECT outside of its protocol buffer, e.g. any slots initialized using the :from-proto option to `define-proto-backed-class', are synchronized against the object's protocol buffer.") (:method ((proto-backed-object proto-backed)) (proto proto-backed-object))) (defgeneric address-range (proto-backed-object) (:documentation "Return any address range of the PROTO-BACKED-OBJECT GTIRB object.")) (defmacro define-proto-backed-class ((class proto-class) super-classes slot-specifiers proto-fields &rest options) "Define a Common Lisp class backed by a protobuf class. SLOT-SPECIFIERS is as in `defclass' with the addition of optional :to-proto and :from-proto fields, which may take protobuf serialization functions, and :skip-equal-p field which causes `is-equal-p' to skip that field. PROTO-FIELDS may hold a list of fields which pass through directly to the backing protobuf class. 
The :parent option names the field holding the containing protobuf element. The :address-range option holds the logic to calculate an address range for instances of the object." (nest (flet ((plist-get (item list) (second (member item list))) (plist-drop (item list) (if-let ((location (position item list))) (append (subseq list 0 location) (subseq list (+ 2 location))) list)))) (let ((from-proto-slots (remove-if-not {find :from-proto} slot-specifiers)) (to-proto-slots (remove-if-not {find :to-proto} slot-specifiers)) (parent (second (assoc :parent options))) (address-range (cdr (assoc :address-range options))))) `(progn (defclass ,class (proto-backed ,@super-classes) ;; Accessors for normal lisp classes ((proto :initarg :proto :accessor proto :type ,proto-class :initform ,(if parent `(let ((it (make-instance ',proto-class))) (setf (proto::uuid it) (new-uuid)) it) `(make-instance ',proto-class)) :documentation "Backing protobuf object. Should not need to be manipulated by client code.") (ir :accessor ir :type (or null gtirb) :initarg :ir :initform nil :documentation ,(format nil "Access the top-level IR of this ~a." class)) ;; TODO: Consider throwing warnings in a `setf :around' ;; defmethod on the parents of objects with parents if ;; the objects are set to something that already has a ;; current parent. This could avoid surprising ;; inconsistencies. Alternately this could throw an ;; error with the option to copy the object with a new ;; corrected parent or to set the parent directly. ,@(when parent `((,parent :accessor ,parent :type (or null ,parent) :initarg ,(make-keyword parent) :initform nil :documentation ,(format nil "Access the ~a of this ~a." 
parent class)))) ,@(mapcar [{plist-drop :to-proto} {plist-drop :from-proto} {plist-drop :proto-field} {plist-drop :skip-equal-p}] slot-specifiers)) ,@(remove-if [«or {eql :parent} {eql :address-range}» #'car] options)) ,@(when parent `((defmethod get-uuid (uuid (object ,class)) (assert (or (ir object) (,parent object)) (object) ,(format nil "`get-uuid' failed on a ~a without a ~a" class parent)) (get-uuid uuid (or (ir object) (,parent object)))) (defmethod set-parent-uuid (new uuid (object ,class)) (assert (or (ir object) (,parent object)) (object) ,(format nil "`set-parent-uuid' failed on a ~a without a ~a" class parent)) (setf (get-uuid uuid (or (ir object) (,parent object))) new)) (defmethod (setf get-uuid) (new uuid (object ,class)) (assert (or (ir object) (,parent object)) (object) ,(format nil "`get-uuid' failed on ~a without a ~a" class parent)) (set-parent-uuid new uuid object)) (defmethod remove-uuid (uuid (object ,class)) (assert (or (ir object) (,parent object)) (object) ,(format nil "`remove-uuid' failed on ~a without a ~a" class parent)) (remove-uuid uuid (or (ir object) (,parent object)))) (defmethod at-address ((object ,class) address) (assert (or (ir object) (,parent object)) (object) ,(format nil "`at-address' failed on ~a without a ~a" class parent)) (at-address (or (ir object) (,parent object)) address)) (defmethod on-address ((object ,class) start &optional end) (assert (or (ir object) (,parent object)) (object) ,(format nil "`on-address' failed on ~a without a ~a" class parent)) (on-address (or (ir object) (,parent object)) start end)))) (defmethod address-range ((self ,class)) ,@address-range) (defmethod initialize-instance :after ((self ,class) &key) ,@(when parent `((when (,parent self) (setf (get-uuid (uuid-to-integer (proto:uuid (proto self))) self) self)))) (with-slots (proto ,@(mapcar #'car from-proto-slots)) self ,@(mapcar (lambda (spec) (destructuring-bind (slot &key from-proto &allow-other-keys) spec `(setf ,slot (funcall ,from-proto 
proto)))) from-proto-slots))) (defmethod update-proto ((self ,class)) ,@(mapcar (lambda (spec) (destructuring-bind (slot &key to-proto (proto-field slot) &allow-other-keys) spec `(setf (,(intern (symbol-name proto-field) 'proto) (proto self)) (funcall ,to-proto (,slot self))))) to-proto-slots) (proto self)) ;; Equality check on class. ;; ;; NOTE: For this to work we might need to add an optional :only ;; field to both slot-specifiers and proto-fields. This ;; would mean that the equality of this field is only ;; checked with this form returns true. E.g., on ;; byte-intervals we could say: ;; (address :type unsigned-byte-64 :only #'addressp) (defmethod is-equal-p-internal ((left ,class) (right ,class)) (and ,@(mapcar (lambda (accessor) `(compare-or-verbose is-equal-p-internal (,accessor left) (,accessor right))) (append (mapcar {plist-get :accessor} (remove-if {plist-get :skip-equal-p} slot-specifiers)) (mapcar #'car proto-fields))))) ;; Pass-through accessors for protobuf fields so they operate ;; directly on the backing protobuf object. 
,@(apply #'append (mapcar (nest (lambda (pair)) (destructuring-bind (name &key type documentation enumeration (proto-field name) &allow-other-keys) pair) (let ((base `(,(intern (symbol-name proto-field) 'proto) (proto obj))))) `((defmethod ,name ((obj ,class)) ,@(when documentation (list documentation)) ,(ecase type ((unsigned-byte-64 boolean bytes) base) (enumeration `(cdr (assoc ,base ,enumeration))) (uuid `(uuid-to-integer ,base)) (string `(pb:string-value ,base)))) (defmethod (setf ,name) (new (obj ,class)) ,@(when documentation (list documentation)) ,(ecase type ((unsigned-byte-64 boolean) `(setf ,base new)) (bytes `(setf ,base (force-byte-array new))) (enumeration `(setf ,base (car (rassoc new ,enumeration)))) (uuid `(setf ,base (integer-to-uuid new))) (string `(setf ,base (pb:string-field new))))))) proto-fields))))) (eval-when (:compile-toplevel :load-toplevel :execute) (defvar aux-data-slot-definition "A-list of auxiliary data objects keyed by string name. Aux-Data tables may hold structured or unstructured data. This data may refer to elements of the GTIRB IR through uuids. Information relevant to a particular module will be stored in Aux-Data tables accessible from the specific module. Aux-Data tables only exist on modules and on GTIRB IR instances.")) ;;;; Classes. 
(define-proto-backed-class (gtirb proto:ir) () ((modules :initarg modules :accessor modules :type list :initform nil :from-proto [{mapcar {make-instance 'module :ir self :gtirb self :proto}} {coerce _ 'list} #'proto:modules] :to-proto {map 'vector #'update-proto} :documentation "List of the modules on a top-level GTIRB IR instance.") (cfg :accessor cfg :type digraph :from-proto (lambda (proto) (let ((p-cfg (proto:cfg proto))) (populate (make-instance 'digraph) :edges-w-values (mapcar (lambda (edge) (cons (list (uuid-to-integer (proto:source-uuid edge)) (uuid-to-integer (proto:target-uuid edge))) (make-instance 'edge-label :proto (proto:label edge)))) (coerce (proto:edges p-cfg) 'list)) :nodes (map 'list #'uuid-to-integer (proto:vertices p-cfg))))) :to-proto (lambda (cfg &aux (p-cfg (make-instance 'proto:cfg))) (setf (proto:vertices p-cfg) (map 'vector #'integer-to-uuid (nodes cfg)) (proto:edges p-cfg) (map 'vector (lambda (edge) (destructuring-bind ((source target) . label) edge (let ((p-edge (make-instance 'proto:edge))) (setf (proto:source-uuid p-edge) (integer-to-uuid source) (proto:target-uuid p-edge) (integer-to-uuid target) (proto:label p-edge) (proto label)) p-edge))) (edges-w-values cfg))) p-cfg) :documentation "Control flow graph (CFG) represented as a `graph:digraph'. Nodes in the graph hold the UUIDs of code blocks which may be looked up using `get-uuid'. 
Edges on the graph are labeled with `edge-label' objects which provide information on the nature of the control flow of the graph.") (aux-data :accessor aux-data :type list :from-proto #'aux-data-from-proto :to-proto #'aux-data-to-proto :documentation #.aux-data-slot-definition) (by-uuid :accessor by-uuid :initform (make-hash-table) :type hash-table :skip-equal-p t :documentation "Internal cache for UUID-based lookup.") (by-address :accessor by-address :initform (make-ranged) :skip-equal-p t :documentation "Internal cache for Address-based lookup.") (aux-data-w-offsets :accessor aux-data-w-offsets :initform nil :skip-equal-p t :documentation "Cache for fast offset updates.")) ((version :type unsigned-byte-64 :documentation "Protobuf version.")) (:documentation "Base class of an instance of GTIRB IR.")) (defmethod initialize-instance :around ((self gtirb) &key) (call-next-method) ;; Populate the aux-data tables with offsets. (setf (aux-data-w-offsets self) (get-aux-data-w-offsets self))) (define-condition ir (error) ((message :initarg :message :initform nil :reader message) (object :initarg :object :initform nil :reader object)) (:report (lambda (condition stream) (format stream "GTIRB error ~S on ~S." (message condition) (object condition)))) (:documentation "Condition raised on GTIRB data structure violations.")) (defmethod print-object ((obj gtirb) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a" (modules obj)))) (defmethod ir ((obj gtirb)) obj) (defmethod get-uuid (uuid (obj gtirb)) (gethash uuid (by-uuid obj))) (defmethod (setf get-uuid) (new uuid (obj gtirb)) (when (zerop uuid) (warn "Saving object ~a without a UUID into ~a." 
new obj)) (when-let ((range (address-range new))) #+debug (format t "(range ~S) ;; => ~S~%" new range) (apply #'insert-address obj new range)) (setf (gethash uuid (by-uuid obj)) new)) (defmethod remove-uuid (uuid (obj gtirb)) (remhash uuid (by-uuid obj))) (defmethod insert-address ((gtirb gtirb) item start &optional end) (ranged-insert (by-address gtirb) (uuid item) start end)) (defmethod delete-address ((gtirb gtirb) item start &optional end) (ranged-delete (by-address gtirb) (uuid item) start end)) (defmethod at-address ((gtirb gtirb) address) (mapcar {get-uuid _ gtirb} (ranged-find-at (by-address gtirb) address))) (defmethod on-address ((gtirb gtirb) start &optional (end start)) (mapcar {get-uuid _ gtirb} (ranged-find (by-address gtirb) start end))) (define-constant +module-isa-map+ '((#.proto:+isa-isa-undefined+ . :undefined) (#.proto:+isa-ia32+ . :ia32) (#.proto:+isa-ppc32+ . :ppc32) (#.proto:+isa-x64+ . :x64) (#.proto:+isa-arm+ . :arm) (#.proto:+isa-valid-but-unsupported+ . :valid-but-unsupported) (#.proto:+isa-ppc64+ . :ppc64) (#.proto:+isa-arm64+ . :arm64) (#.proto:+isa-mips32+ . :mips32) (#.proto:+isa-mips64+ . :mips64)) :test #'equal) (define-constant +module-file-format-map+ '((#.proto:+file-format-coff+ . :coff) (#.proto:+file-format-elf+ . :elf) (#.proto:+file-format-ida-pro-db32+ . :ida-pro-db32) (#.proto:+file-format-ida-pro-db64+ . :ida-pro-db64) (#.proto:+file-format-macho+ . :macho) (#.proto:+file-format-pe+ . :pe) (#.proto:+file-format-raw+ . :raw) (#.proto:+file-format-xcoff+ . :xcoff) (#.proto:+file-format-format-undefined+ . :format-undefined)) :test #'equal) (define-constant +module-byte-order-map+ `((#.proto:+byte-order-byte-order-undefined+ . :undefined) (#.proto:+byte-order-big-endian+ . :big-endian) (#.proto:+byte-order-little-endian+ . 
:little-endian)) :test #'equal) (define-proto-backed-class (module proto:module) () ((proxies :accessor proxies :type hash-table :initform (make-hash-table) :from-proto (lambda (proto &aux (table (make-hash-table))) (let ((proto-proxies (proto:proxies proto))) (dotimes (n (length proto-proxies) table) (let ((it (aref proto-proxies n))) (setf (gethash (uuid-to-integer (proto:uuid it)) table) (make-instance 'proxy-block :ir (ir self) :module self :proto it)))))) :to-proto [{map 'vector (lambda (uuid) (let ((it (make-instance 'proto:proxy-block))) (setf (proto:uuid it) (integer-to-uuid uuid)) it))} {mapcar #'car} #'hash-table-alist] :documentation "Hash-table of proxy-blocks keyed by UUID. Proxy-blocks in GTIRB are used to represent cross-module linkages. For example when code in a module calls to a function defined in an external library, the CFG for that IR instance may represent this call with a call edge to a proxy block representing the external called function.") (symbols :accessor symbols :type list :initform nil :from-proto [{map 'list {make-instance 'symbol :ir (ir self) :module self :proto}} #'proto:symbols] :to-proto {map 'vector #'update-proto} :documentation "Hash-table of symbols keyed by UUID.") (sections :accessor sections :type list :from-proto [{map 'list {make-instance 'section :ir (ir self) :module self :proto}} #'proto:sections] :to-proto {map 'vector #'update-proto} :documentation "List of the sections comprising this module.") (aux-data :accessor aux-data :type list :from-proto #'aux-data-from-proto :to-proto #'aux-data-to-proto :documentation #.aux-data-slot-definition)) ((name :type string :documentation "An optional human-readable name for this module.") (binary-path :type string :documentation "The path or filename for this module. E.g, the name of a dynamically loaded library or of the main executable.") (preferred-addr :type unsigned-byte-64 :documentation "Some systems specify a preferred address in memory. 
On those systems this field may be used to capture this address.") (rebase-delta :type unsigned-byte-64 :documentation "The difference between this module's and `preferred-addr' and the address at which it was actually loaded.") (isa :type enumeration :enumeration +module-isa-map+ :documentation "The instruction set architecture (ISA) of the code in this module.") (file-format :type enumeration :enumeration +module-file-format-map+ :documentation "The binary file format of the original file this module represents.") (byte-order :type enumeration :enumeration +module-byte-order-map+ :documentation "The byte-order of the bytes in this module.")) (:documentation "Module of a GTIRB IR instance.") (:parent gtirb)) (defmethod make-instance :around ((class (eql 'module)) &rest initargs &key &allow-other-keys) (let ((proto (or (getf initargs :proto) (let ((new-proto (make-instance 'proto:module))) (if-let ((name (getf initargs :name))) (setf (proto:name new-proto) (pb:string-field name)) (warn "Modules created without a name")) new-proto)))) (apply #'call-next-method class :proto proto initargs))) (defmethod print-object ((obj module) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a ~a ~s" (file-format obj) (isa obj) (name obj)))) (defgeneric get-aux-data-w-offsets (object) (:documentation "Collect all Aux-Data tables with offsets in their types.") (:method ((list list)) (remove-if-not [{find :offset} #'flatten #'aux-data-type #'cdr] list)) (:method ((self module)) (get-aux-data-w-offsets (aux-data self))) (:method ((self gtirb)) (apply #'append (get-aux-data-w-offsets (aux-data self)) (mapcar #'get-aux-data-w-offsets (modules self))))) (defmethod (setf aux-data) :after (new-value (self gtirb)) (declare (ignorable new-value)) (setf (aux-data-w-offsets self) (get-aux-data-w-offsets self))) (defmethod (setf aux-data) :after (new-value (self module)) (declare (ignorable new-value)) (setf (aux-data-w-offsets (ir self)) 
(get-aux-data-w-offsets (ir self)))) (define-constant +edge-label-type-map+ '((#.proto:+edge-type-type-branch+ . :branch) (#.proto:+edge-type-type-call+ . :call) (#.proto:+edge-type-type-fallthrough+ . :fallthrough) (#.proto:+edge-type-type-return+ . :return) (#.proto:+edge-type-type-syscall+ . :syscall) (#.proto:+edge-type-type-sysret+ . :sysret)) :test #'equal) (define-proto-backed-class (edge-label proto:edge-label) () () ((conditional :type boolean :documentation "This is true if this edge is due to a conditional instruction.") (direct :type boolean :documentation "Is this a direct (as opposed to indirect) control flow edge.") (edge-type :type enumeration :enumeration +edge-label-type-map+ :proto-field type :documentation "The type of an edge indicates the nature of the control flow along it. E.g., \"branch,\" \"call,\" \"fallthrough,\" and \"return\" are examples.")) (:documentation "Label on a CFG edge. This indicates the type of control flow along this edge.")) (defmethod print-object ((obj edge-label) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a ~:[unconditional~;conditional~] ~:[undirect~;direct~]" (edge-type obj) (conditional obj) (direct obj)))) (define-proto-backed-class (symbol proto:symbol) () () ((name :type string) (value :type unsigned-byte-64) (referent-uuid :type uuid) (at-end :type boolean)) (:documentation "Symbol with it's NAME and an optional VALUE or REFERENT.") (:parent module)) (defgeneric payload (symbol) (:documentation "Provide access to the referent or value of SYMBOL.") (:method ((symbol symbol)) (cond ((proto:has-value (proto symbol)) (value symbol)) ((proto:has-referent-uuid (proto symbol)) (get-uuid (referent-uuid symbol) symbol))))) (defmethod (setf payload) ((new proto-backed) (symbol symbol)) "Save GTIRB object NEW into the `referent-uuid' of SYMBOL." 
(proto:clear-value (proto symbol)) (setf (referent-uuid symbol) (uuid new))) (defmethod (setf payload) ((new integer) (symbol symbol)) "Save INTEGER value NEW into the `value' of SYMBOL." (proto:clear-referent-uuid (proto symbol)) (setf (value symbol) new)) (defmethod (setf payload) ((new t) (symbol symbol)) (error "Symbol payload ~S must be either a GTIRB element or an integer." new)) (defmethod print-object ((obj symbol) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a ~a~:[~;|~]" (name obj) (or (value obj) (referent-uuid obj)) (at-end obj)))) (define-constant +section-flags-map+ '((#.proto:+section-flag-section-undefined+ . :flag-undefined) (#.proto:+section-flag-readable+ . :readable) (#.proto:+section-flag-writable+ . :writable) (#.proto:+section-flag-executable+ . :executable) (#.proto:+section-flag-loaded+ . :loaded) (#.proto:+section-flag-initialized+ . :initialized) (#.proto:+section-flag-thread-local+ . :thread-local)) :test #'equal) (define-proto-backed-class (section proto:section) () ((byte-intervals :accessor byte-intervals :type list :from-proto [{map 'list {make-instance 'byte-interval :ir (ir self) :section self :proto}} #'proto:byte-intervals] :to-proto {map 'vector #'update-proto} :documentation "Byte-intervals holding all of the section's bytes.")) ((name :type string :documentation "Name of this section.") (flags :type enumeration :enumeration +section-flags-map+ :proto-field section-flags :documentation "Flags holding common properties of this section. 
These flags only hold those section properties which are relatively universal including read, write, execute permissions, whether the section is loaded into memory at run-time or not, whether the section is zero initialized, and whether the section is thread-local.")) (:documentation "Section in a GTIRB IR instance.") (:parent module)) (defmethod print-object ((obj section) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a ~a" (name obj) (length (byte-intervals obj))))) (defmethod address ((obj section)) (extremum (mapcar #'address (byte-intervals obj)) #'<)) (defmethod size ((it section)) (- (extremum (mapcar «+ #'address #'size» (byte-intervals it)) #'> :key #'car) (address it))) (defgeneric blocks (obj) (:documentation "List of gtirb-byte-block objects in this object. Primitive accessor for byte-interval.") (:method ((obj gtirb)) (mappend #'blocks (modules obj))) (:method ((obj module)) (mappend #'blocks (sections obj))) (:method ((obj section)) (mappend #'blocks (byte-intervals obj)))) (define-proto-backed-class (offset proto:offset) () () ((element-id :type uuid) (displacement :type unsigned-byte-64)) (:documentation "Offset into a GTIRB object.")) (define-constant +se-attribute-flag-map+ '( (#.proto:+se-attribute-flag-got+ . :got) (#.proto:+se-attribute-flag-gotpc+ . :gotpc) (#.proto:+se-attribute-flag-gotoff+ . :gotoff) (#.proto:+se-attribute-flag-gotrel+ . :gotrel) (#.proto:+se-attribute-flag-plt+ . :plt) (#.proto:+se-attribute-flag-pltoff+ . :pltoff) (#.proto:+se-attribute-flag-pcrel+ . :pcrel) (#.proto:+se-attribute-flag-secrel+ . :secrel) (#.proto:+se-attribute-flag-tls+ . :tls) (#.proto:+se-attribute-flag-tlsgd+ . :tlsgd) (#.proto:+se-attribute-flag-tlsld+ . :tlsld) (#.proto:+se-attribute-flag-tlsldm+ . :tlsldm) (#.proto:+se-attribute-flag-tlscall+ . :tlscall) (#.proto:+se-attribute-flag-tlsdesc+ . :tlsdesc) (#.proto:+se-attribute-flag-tprel+ . :tprel) (#.proto:+se-attribute-flag-tpoff+ . 
:tpoff) (#.proto:+se-attribute-flag-dtprel+ . :dtprel) (#.proto:+se-attribute-flag-dtpoff+ . :dtpoff) (#.proto:+se-attribute-flag-dtpmod+ . :dtpmod) (#.proto:+se-attribute-flag-ntpoff+ . :ntpoff) (#.proto:+se-attribute-flag-page+ . :page) (#.proto:+se-attribute-flag-pageoff+ . :pageoff) (#.proto:+se-attribute-flag-call+ . :call) (#.proto:+se-attribute-flag-lo+ . :lo) (#.proto:+se-attribute-flag-hi+ . :hi) (#.proto:+se-attribute-flag-higher+ . :higher) (#.proto:+se-attribute-flag-highest+ . :highest) (#.proto:+se-attribute-flag-gotntpoff+ . :gotntpoff) (#.proto:+se-attribute-flag-indntpoff+ . :indntpoff) (#.proto:+se-attribute-flag-g0+ . :g0) (#.proto:+se-attribute-flag-g1+ . :g1) (#.proto:+se-attribute-flag-g2+ . :g2) (#.proto:+se-attribute-flag-g3+ . :g3) (#.proto:+se-attribute-flag-upper16+ . :upper16) (#.proto:+se-attribute-flag-lower16+ . :lower16) (#.proto:+se-attribute-flag-lo12+ . :lo12) (#.proto:+se-attribute-flag-lo15+ . :lo15) (#.proto:+se-attribute-flag-lo14+ . :lo14) (#.proto:+se-attribute-flag-hi12+ . :hi12) (#.proto:+se-attribute-flag-hi21+ . :hi21) (#.proto:+se-attribute-flag-s+ . :s) (#.proto:+se-attribute-flag-pg+ . :pg) (#.proto:+se-attribute-flag-nc+ . :nc) (#.proto:+se-attribute-flag-abs+ . :abs) (#.proto:+se-attribute-flag-prel+ . :prel) (#.proto:+se-attribute-flag-prel31+ . :prel31) (#.proto:+se-attribute-flag-target1+ . :target1) (#.proto:+se-attribute-flag-target2+ . :target2) (#.proto:+se-attribute-flag-sbrel+ . :sbrel) (#.proto:+se-attribute-flag-tlsldo+ . :tlsldo) (#.proto:+se-attribute-flag-hi16+ . :hi16) (#.proto:+se-attribute-flag-lo16+ . :lo16) (#.proto:+se-attribute-flag-gprel+ . :gprel) (#.proto:+se-attribute-flag-disp+ . :disp) (#.proto:+se-attribute-flag-ofst+ . :ofst) (#.proto:+se-attribute-flag-h+ . :h) (#.proto:+se-attribute-flag-l+ . :l) (#.proto:+se-attribute-flag-ha+ . :ha) (#.proto:+se-attribute-flag-high+ . :high) (#.proto:+se-attribute-flag-higha+ . :higha) (#.proto:+se-attribute-flag-highera+ . 
:highera) (#.proto:+se-attribute-flag-highesta+ . :highesta) (#.proto:+se-attribute-flag-tocbase+ . :tocbase) (#.proto:+se-attribute-flag-toc+ . :toc) (#.proto:+se-attribute-flag-notoc+ . :notoc)) :test #'equal :documentation "See doc/general/SymbolicExpression.md for more details.") (define-proto-backed-class (byte-interval proto:byte-interval) () ((blocks :initarg :blocks :accessor blocks :type list :from-proto [{map 'list (lambda (proto-block) (let ((it (cond ((not (emptyp (proto:uuid (proto:data proto-block)))) (make-instance 'data-block :ir (ir self) :byte-interval self :offset (proto:offset proto-block) :proto (proto:data proto-block))) ((not (emptyp (proto:uuid (proto:code proto-block)))) (make-instance 'code-block :ir (ir self) :byte-interval self :offset (proto:offset proto-block) :proto (proto:code proto-block)))))) #+debug (when (emptyp (proto:uuid (proto it))) (warn "BAD BLOCK ~a with empty uuid from ~a.~%~A~%" it (name (section self)) proto-block)) it))} #'proto:blocks] :to-proto {map 'vector (lambda (gtirb-block) (let ((it (make-instance 'proto:block))) (setf (proto:offset it) (offset gtirb-block)) (etypecase gtirb-block (code-block (setf (proto:code it) (update-proto gtirb-block))) (data-block (setf (proto:data it) (update-proto gtirb-block)))) it))} :documentation "Blocks in this byte-interval. 
This list could include `code-block' or `data-block' elements (which
both subclass the `gtirb-byte-block' class) but not `proxy-block'
elements as proxy blocks do not hold bytes.")
    (symbolic-expressions
     :accessor symbolic-expressions :type hash-table
     :initarg :symbolic-expressions
     ;; Build the offset->symbolic-expression table from the protobuf,
     ;; resolving symbol UUIDs against the containing IR.
     :from-proto
     (lambda (proto &aux (table (make-hash-table)))
       (flet ((process-symbols (&rest symbols)
                ;; Map raw UUID byte vectors to symbol objects,
                ;; warning about (and dropping) any non-empty UUID
                ;; with no match in the IR.
                (mappend (lambda (uuid)
                           (if-let ((sym (get-uuid (uuid-to-integer uuid)
                                                   (ir self))))
                             (list sym)
                             (unless (emptyp uuid)
                               (warn "Symbol UUID ~S not found" uuid))))
                         symbols)))
         (dotimes (n (length (proto:symbolic-expressions proto)) table)
           (let* ((proto (aref (proto:symbolic-expressions proto) n))
                  (offset (proto:key proto))
                  (attribute-flags
                   (map 'list [#'cdr {assoc _ +se-attribute-flag-map+}]
                        (proto:attribute-flags (proto:value proto))))
                  (symbolic-expression (proto:value proto)))
             (setf (gethash offset table)
                   (cond
                     ((proto:has-addr-const symbolic-expression)
                      (make-instance 'sym-addr-const
                        :ir (ir self)
                        :attribute-flags attribute-flags
                        :symbols (process-symbols
                                  (proto:symbol-uuid
                                   (proto:addr-const symbolic-expression)))
                        :proto (proto:addr-const symbolic-expression)))
                     ((proto:has-addr-addr symbolic-expression)
                      (make-instance 'sym-addr-addr
                        :ir (ir self)
                        :attribute-flags attribute-flags
                        :symbols (process-symbols
                                  (proto:symbol1-uuid
                                   (proto:addr-addr symbolic-expression))
                                  (proto:symbol2-uuid
                                   (proto:addr-addr symbolic-expression)))
                        :proto (proto:addr-addr symbolic-expression)))
                     ;; BUG FIX: this previously read
                     ;; (assert "Symbolic expression of unknown kind.")
                     ;; which can never fire -- a non-nil string literal is
                     ;; always a true test-form -- so unknown kinds were
                     ;; silently entered into the table as NIL.  Signal a
                     ;; real error instead.
                     (t (error "Symbolic expression of unknown kind.")))))))))
     :to-proto
     [{map 'vector
           (lambda (pair)
             (destructuring-bind (offset .
symbolic-expression) pair (flet ((force-attribute-flags-array (array) (declare (type (simple-array) array)) (make-array (length array) :element-type `(mod ,(length +se-attribute-flag-map+)) :initial-contents array))) (let ((it (make-instance 'proto:byte-interval-symbolic-expressions-entry))) (setf (proto:key it) offset (proto:value it) (let ((it (make-instance 'proto:symbolic-expression))) (when (attribute-flags symbolic-expression) (setf (proto:attribute-flags it) (force-attribute-flags-array (map 'vector [#'car {rassoc _ +se-attribute-flag-map+}] (attribute-flags symbolic-expression))))) (etypecase symbolic-expression (sym-addr-const (setf (proto:addr-const it) (update-proto symbolic-expression))) (sym-addr-addr (setf (proto:addr-addr it) (update-proto symbolic-expression)))) it)) it))))} #'hash-table-alist] :documentation "Hash of symbolic-expressions keyed by offset.")) ((addressp :type boolean :proto-field has-address :documentation "Does this byte-interval have an address.") (address :type unsigned-byte-64 :documentation "Optionally specify the address in memory at which this ~ byte-interval should start. Byte-intervals without address could exist anywhere in memory.") (size :type unsigned-byte-64 :documentation "The size of this byte-interval. 
It is possible for the size of a byte-interval to be larger than the number of bytes in the byte interval's `contents' if portions of the byte-interval are not represented statically but are zero-initialized at runtime.") (contents :type bytes :documentation "A vector holding the actual bytes of this byte interval.")) (:documentation "Byte-interval in a GTIRB instance.") (:parent section) (:address-range (when (addressp self) (list (address self) (+ (address self) (size self)))))) (defmethod (setf size) :before (new (obj byte-interval)) (restart-case (when (> (length (contents obj)) new) (error (make-condition 'ir :message "size smaller than contents" :object obj))) (truncate-contents () :report "Truncate the contents of the byte-interval to the new size." (setf (contents obj) (subseq (contents obj) 0 new))) (ignore () :report "Ignore and leave the byte-interval in an inconsistent state."))) (defmethod print-object ((obj byte-interval) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a ~a" (if (addressp obj) (address obj) "?") (size obj)))) (defmethod address ((obj byte-interval)) (when (addressp obj) (proto:address (proto obj)))) (defclass symbolic-expression () ((symbols :accessor symbols :initarg :symbols :initform nil :type list :documentation "Symbol(s) appearing in this symbolic expression.") (attribute-flags :accessor attribute-flags :initarg :attribute-flags :initform nil :type list :documentation "Attributes holding the relocation type."))) (defmethod print-object ((obj symbolic-expression) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a ~{~a~^, ~}" (offset obj) (symbols obj)))) ;;; TODO: If we get symbolic expressions for these, then add the ;;; following to each `symbolic-expression' class: ;;; ;;; (:parent byte-interval) ;;; (:address-range (when-let ((range (addressp (byte-interval self)))) ;;; (+ (offset self) (first range)))) ;;; ;;; and then go back up and add ":byte-interval 
self" to their
;;; `make-instance' calls in byte-interval.

(define-proto-backed-class (sym-addr-const proto:sym-addr-const)
    (symbolic-expression) ()
    ((offset :type unsigned-byte-64))
  (:address-range (when (addressp (byte-interval self))
                    (let ((address (+ (address (byte-interval self))
                                      (offset self))))
                      (list address address)))))

(define-proto-backed-class (sym-addr-addr proto:sym-addr-addr)
    (symbolic-expression) ()
    ((offset :type unsigned-byte-64)
     (scale :type unsigned-byte-64))
  (:address-range (when (addressp (byte-interval self))
                    (let ((address (+ (address (byte-interval self))
                                      (offset self))))
                      (list address address)))))

;;; Push the referent symbol UUIDs back into the protobuf before
;;; serialization.  NOTE: a second, byte-identical copy of each of
;;; these two methods followed here; a DEFMETHOD with the same
;;; qualifier and specializers simply redefines the first, so the
;;; duplicates were dead code and have been removed.
(defmethod update-proto :before ((sym sym-addr-const))
  (setf (proto:symbol-uuid (proto sym))
        (integer-to-uuid (uuid (first (symbols sym))))))

(defmethod update-proto :before ((sym sym-addr-addr))
  (setf (proto:symbol1-uuid (proto sym))
        (integer-to-uuid (uuid (first (symbols sym))))
        (proto:symbol2-uuid (proto sym))
        (integer-to-uuid (uuid (second (symbols sym))))))

(defclass gtirb-block () ())

(defclass gtirb-byte-block (gtirb-block) ()
  (:documentation "Super-class of the `code-block' and `data-block' classes.
This class abstracts over all GTIRB blocks which are able to hold
bytes."))

;; Restrict the containing byte-interval's offset->symbolic-expression
;; table to the entries whose offset falls inside this block's extent.
;; NOTE(review): the lower bound uses a strict {< (offset bb)}, so an
;; expression sitting at exactly the block's starting offset is
;; excluded -- confirm this exclusive lower bound is intentional.
(defmethod symbolic-expressions ((bb gtirb-byte-block))
  (nest (alist-hash-table)
        (remove-if-not
         [«and {< (offset bb)} {>= (+ (offset bb) (size bb))}» #'car])
        (hash-table-alist)
        (symbolic-expressions)
        (byte-interval bb)))

;; A byte-block's address is its offset added to the address of its
;; byte-interval; NIL when the byte-interval has no address.
(defmethod address ((obj gtirb-byte-block))
  (when-let ((base-address (address (byte-interval obj))))
    (+ base-address (offset obj))))

(defgeneric bytes (object &optional start end)
  (:documentation "Return the bytes held by OBJECT.")
  (:method ((obj byte-interval) &optional (start 0) end)
    (if end
        (subseq (contents obj) start end)
        (subseq (contents obj) start)))
  (:method ((obj gtirb-byte-block) &optional (start 0) (end (size obj)))
    #+debug
    (format t "[~S] ~S:[~S:~S]<-[~S:~S]~%"
            (proto:uuid (proto obj))
            (name (section (byte-interval obj)))
            (or (and (addressp (byte-interval obj))
                     (address (byte-interval obj)))
                "?")
            (size (byte-interval obj))
            (offset obj)
            (size obj))
    ;; Translate block-relative START/END into byte-interval-relative
    ;; positions before indexing into the interval's contents.
    (let* ((start (+ (offset obj) start))
           (end (+ (offset obj) end)))
      (assert (<= end (size (byte-interval obj))) (obj)
              "Block's end ~d exceeds size of containing byte-interval ~d."
              end (size (byte-interval obj)))
      ;; A byte-interval's SIZE may exceed the length of its CONTENTS;
      ;; the trailing, unallocated bytes are implicitly zero.
      (let ((real-end (length (contents (byte-interval obj)))))
        (cond ((<= end real-end)        ; Allocated bytes.
               (subseq (contents (byte-interval obj)) start end))
              ((<= start real-end) ; Both allocated and un-allocated bytes.
               (concatenate 'vector
                            (subseq (contents (byte-interval obj)) start)
                            (make-array (- end real-end)
                                        :initial-element 0)))
              (t                       ; Un-allocated bytes, zero-fill.
               (make-array (size obj) :initial-element 0)))))))

(defun shift-subseq (sequence start end)
  "Return a copy of SEQUENCE bounded by START and END."
(subseq sequence start end)) (defparameter *preserve-symbolic-expressions* nil "When true, (setf bytes) preserves symbolic expressions intersecting the assigned part of the object.") (define-setf-expander shift-subseq (sequence start end &environment env) "Update the subseq of SEQUENCE bounded by START and END." (multiple-value-bind (dummies vals newval setter getter) (get-setf-expansion sequence env) (declare (ignorable newval setter)) (let ((store (gensym))) (values dummies ; Temporary variables vals ; Value forms. (list store) ; Store variables. `(progn (cond ((zerop ,start) (setf ,getter (concatenate 'vector ,store (subseq ,getter ,end)))) ((= (length ,store) (- ,end ,start)) (setf (subseq ,getter ,start ,end) ,store)) ((>= ,end (length ,getter)) (setf ,getter (concatenate 'vector (subseq ,getter 0 ,start) ,store))) (t (setf ,getter (concatenate 'vector (subseq ,getter 0 ,start) ,store (subseq ,getter ,end))))) ,store) ; Storing form. `(shift-subseq ,getter))))) ; Accessing form. (define-setf-expander bytes (sequence &optional (start 0) (end nil end-p) &environment env) (multiple-value-bind (dummies vals newval setter getter) (get-setf-expansion sequence env) (declare (ignorable newval setter)) (let ((store (gensym)) (end (if end-p end `(length (bytes ,getter))))) (values dummies ; Temporary variables vals ; Value forms. (list store) ; Store variables. `(progn (etypecase ,getter (gtirb::byte-interval (setf (shift-subseq (contents ,getter) ,start ,end) ,store)) (gtirb::gtirb-byte-block (with-slots (offset) ,getter (let ((original-offset offset)) (setf (shift-subseq (contents (byte-interval ,getter)) (+ offset ,start) (+ offset ,end)) ,store) (setf-bytes-after ,store (byte-interval ,getter) (+ offset ,start) (+ offset ,end)) ;; Ensure the offset for THIS block isn't pushed back change. (setf offset original-offset))))) (setf-bytes-after ,store ,getter ,start ,end) ,store) ; Storing form. `(bytes ,getter))))) ; Accessing form. 
(defvar *update-aux-data-offsets* nil "Are offsets in AuxData tables updated as bytes are modified.") (defgeneric setf-bytes-after (new object &optional start end) (:documentation "Update the offsets into BYTE-INTERVAL due to saving NEW into START END.") (:method (new (byte-interval byte-interval) &optional (start 0) (end (size byte-interval))) (setf (size byte-interval) (+ start (length new) (- (size byte-interval) end))) (let ((difference (- (length new) (- end start)))) ;; Symbolic expressions. (nest (setf (symbolic-expressions byte-interval)) (alist-hash-table) (mappend (lambda (pair) (destructuring-bind (offset . sym-expr) pair (cond ((< offset start) (list (cons offset sym-expr))) ((>= offset end) (list (cons (+ offset difference) sym-expr))) ;; Clear symbolic expressions in the modified range, ;; unless *preserve-symbolic-expressions* is true. (t (if *preserve-symbolic-expressions* (list pair) nil)))))) (hash-table-alist (symbolic-expressions byte-interval))) (when *update-aux-data-offsets* ;; Update offsets in AuxData tables. (labels ((update-offset (data type) (cond ((and (listp type) (eql :mapping (car type))) (nest (alist-hash-table) (mapcar «cons [{update-offset _ (second type)} #'car] [{update-offset _ (third type)} #'cdr]») (hash-table-alist data))) ((and (listp type) (eql :sequence (car type))) (mapcar {update-offset _ (cdr type)} data)) ((eql :offset type) ;; NOTE: Since we are already adjusting all ;; other code blocks and offsets are ;; currently stored by code block we only ;; need to update offsets in the current ;; code block. ;; NOTE: Offsets are relative to the base of the ;; code block but START is relative to the ;; base of the byte-interval. ;; NOTE: Only update offsets in the current ;; block. 
(let* ((obj (get-uuid (first data) byte-interval)) (obj-start (if (typep obj 'gtirb-byte-block) (offset obj) most-positive-fixnum)) (obj-end (+ obj-start (size obj))) (off (second data))) (when (and ;; Changes bytes intersect this block (or (and (>= obj-start start) (<= obj-start end)) (and (>= obj-end start) (<= obj-end end))) ;; This offset is after the start ;; of the changed bytes (>= (+ (offset obj) off) start)) (incf (second data) difference))) data) (t data)))) (mapcar (lambda (pair) (let ((table (cdr pair))) (setf (aux-data-data table) (update-offset (aux-data-data table) (aux-data-type table))))) (aux-data-w-offsets (ir byte-interval))))) ;; Byte-Blocks. (mapc (lambda (bb) (with-slots (offset) bb (when (>= offset end) (incf offset difference)))) (blocks byte-interval))) new) (:method (new (bb gtirb-byte-block) &optional (start 0) (end (size bb))) ;; Update the size of the byte-block (setf (size bb) (+ start (length new) (- (size bb) end))) new)) (define-proto-backed-class (code-block proto:code-block) (gtirb-byte-block) ((offset :initarg :offset :accessor offset :type number :documentation "Offset into this block's bytes in the block's byte-interval.")) ((size :type unsigned-byte-64 :documentation "The length of the bytes held by this code block.") (decode-mode :type unsigned-byte-64 :documentation "Only present on architecture with multiple decode-modes.")) (:documentation "Code-block in a GTIRB IR instance.") (:parent byte-interval) (:address-range (when-let ((range (address-range (byte-interval self)))) (list (+ (offset self) (first range)) (+ (offset self) (size self) (first range)))))) (defmethod print-object ((obj code-block) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a ~a" (size obj) (decode-mode obj)))) (defgeneric entry-point (module) (:documentation "The code-block which is the entry point of MODULE.") (:method ((obj module)) (get-uuid (uuid-to-integer (proto:entry-point (proto obj))) obj))) (defmethod 
(setf entry-point) ((new code-block) (obj module)) (proto:clear-entry-point (proto obj)) (setf (proto:entry-point (proto obj)) (integer-to-uuid (uuid new)))) (define-proto-backed-class (data-block proto:data-block) (gtirb-byte-block) ((offset :initarg :offset :accessor offset :type number :documentation "Offset into this block's bytes in the block's byte-interval.")) ((size :type unsigned-byte-64 :documentation "The length of the bytes held by this data block.")) (:documentation "Data-block in a GTIRB IR instance.") (:parent byte-interval) (:address-range (when-let ((range (address-range (byte-interval self)))) (list (+ (offset self) (first range)) (+ (offset self) (size self) (first range)))))) (defmethod print-object ((obj data-block) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a" (size obj)))) (define-proto-backed-class (proxy-block proto:proxy-block) (gtirb-block) () () (:documentation "Proxy-block in a GTIRB IR instance.") (:parent module)) (defmethod print-object ((obj proxy-block) stream) (print-unreadable-object (obj stream :type t :identity t))) ;;;; AuxData type and data handling. (define-proto-backed-class (aux-data proto:aux-data) () () ()) (defmethod print-object ((obj aux-data) stream) (print-unreadable-object (obj stream :type t :identity t) (format stream "~a" (aux-data-type obj)))) (defun aux-data-from-proto (proto) (let ((p-aux-data (proto:aux-data proto)) (aux-data '())) (dotimes (n (length p-aux-data)) (push (cons (pb:string-value (proto:key (aref p-aux-data n))) (make-instance 'aux-data :proto (proto:value (aref p-aux-data n)))) aux-data)) aux-data)) (defun aux-data-to-proto (aux-data) (map 'vector (lambda (pair) (destructuring-bind (name . 
aux-data) pair (let ((entry (make-instance 'proto:module-aux-data-entry))) (setf (proto:key entry) (pb:string-field name) (proto:value entry) (proto aux-data)) entry))) aux-data)) (defmacro start-case (string &body body) `(progn ;; (declare (type string ,string)) (assert (stringp ,string) (,string) "Argument ~s is not a string." ,string) (cond ,@(mapcar (lambda (form) (destructuring-bind (prefix . body) form (if (stringp prefix) `((eql (search ,prefix ,string) 0) (let ((,string (subseq ,string ,(length prefix)))) ,@body)) (cons prefix body)))) body)))) (defparameter +integer-typename-regex+ (create-scanner "(U?INT)([0-9]+)-T") "Regex for deconstructing an integer typename.") (defun matching (open-char close-char string) "Return the first balanced offset of CLOSE-CHAR in STRING. STRING is assumed to already have one extant OPEN-CHAR which needs to be matched. New instances of OPEN-CHAR must be closed by balanced CLOSE-CHARs before the CLOSE-CHAR matching the implicit extant OPEN-CHAR." (let ((offset 1)) (dotimes (n (length string)) (cond ((eql (aref string n) open-char) (incf offset)) ((eql (aref string n) close-char) (decf offset))) (when (zerop offset) (return-from matching n)))) (error "Can't close (~a ~a) in ~s." 
open-char close-char string)) (defun aux-data-type-read (type-string) (when (and type-string (not (emptyp type-string))) (start-case type-string ("mapping<" (let ((close (matching #\< #\> type-string))) (cons (cons :mapping (aux-data-type-read (subseq type-string 0 close))) (aux-data-type-read (subseq type-string close))))) ("set<" (let ((close (matching #\< #\> type-string))) (cons (cons :set (aux-data-type-read (subseq type-string 0 close))) (aux-data-type-read (subseq type-string close))))) ("sequence<" (let ((close (matching #\< #\> type-string))) (cons (cons :sequence (aux-data-type-read (subseq type-string 0 close))) (aux-data-type-read (subseq type-string close))))) ("tuple<" (let ((close (matching #\< #\> type-string))) (cons (cons :tuple (aux-data-type-read (subseq type-string 0 close))) (aux-data-type-read (subseq type-string close))))) ("variant<" (let ((close (matching #\< #\> type-string))) (cons (cons :variant (aux-data-type-read (subseq type-string 0 close))) (aux-data-type-read (subseq type-string close))))) ("," (aux-data-type-read type-string)) (">" (aux-data-type-read type-string)) ("UUID" (cons :uuid (aux-data-type-read type-string))) ("Addr" (cons :addr (aux-data-type-read type-string))) ("Offset" (cons :offset (aux-data-type-read type-string))) ("string" (cons :string (aux-data-type-read type-string))) ("bool" (cons :bool (aux-data-type-read type-string))) ("uint8_t" (cons :uint8-t (aux-data-type-read type-string))) ("uint16_t" (cons :uint16-t (aux-data-type-read type-string))) ("uint32_t" (cons :uint32-t (aux-data-type-read type-string))) ("uint64_t" (cons :uint64-t (aux-data-type-read type-string))) ("int8_t" (cons :int8-t (aux-data-type-read type-string))) ("int16_t" (cons :int16-t (aux-data-type-read type-string))) ("int32_t" (cons :int32-t (aux-data-type-read type-string))) ("int64_t" (cons :int64-t (aux-data-type-read type-string))) ("float" (cons :float (aux-data-type-read type-string))) ("double" (cons :double (aux-data-type-read 
type-string))) (t (error "Junk in type string ~a" type-string))))) (defgeneric aux-data-type (aux-data) (:documentation "Access the structured type of AUX-DATA.") (:method ((obj aux-data)) (first (aux-data-type-read (pb:string-value (proto:type-name (proto obj))))))) (defun aux-data-type-print (stream type &optional colon-modifier-supplied-p at-sign-modifier-supplied-p (repetitions 1)) (declare (type (or null (eql t) stream string) stream)) (declare (ignorable colon-modifier-supplied-p at-sign-modifier-supplied-p repetitions)) (when type (if (listp type) (case (first type) (:mapping (format stream "mapping<~/gtirb:aux-data-type-print/,~/gtirb:aux-data-type-print/>" (second type) (third type))) (:set (format stream "set<~/gtirb:aux-data-type-print/>" (second type))) (:sequence (format stream "sequence<~/gtirb:aux-data-type-print/>" (second type))) (:tuple (format stream "tuple<~{~/gtirb:aux-data-type-print/~^,~}>" (cdr type))) (:variant (format stream "variant<~{~/gtirb:aux-data-type-print/~^,~}>" (cdr type)))) (format stream (ecase type (:uuid "UUID") (:addr "Addr") (:offset "Offset") (:string "string") (:bool "bool") (:uint8-t "uint8_t") (:uint16-t "uint16_t") (:uint32-t "uint32_t") (:uint64-t "uint64_t") (:int8-t "int8_t") (:int16-t "int16_t") (:int32-t "int32_t") (:int64-t "int64_t") (:float "float") (:double "double")))))) (defmethod (setf aux-data-type) (new (obj aux-data)) (setf (proto:type-name (proto obj)) (pb:string-field (format nil "~/gtirb::aux-data-type-print/" new)))) (defgeneric aux-data-data (aux-data) (:documentation "Access the structured representation of AUX-DATAs data.") (:method ((obj aux-data)) (aux-data-decode (aux-data-type obj) (proto:data (proto obj))))) (defmethod (setf aux-data-data) (new (obj aux-data)) (setf (proto:data (proto obj)) (force-byte-array (aux-data-encode (aux-data-type obj) new)))) (defun parse-num-bytes (num-bits-string) (/ (parse-integer num-bits-string) 8)) (declaim (special *decode-data*)) (defun decode (type) (labels 
((advance (n) (setf *decode-data* (subseq *decode-data* n))) (decode-int (type) (register-groups-bind (type-signage (#'parse-num-bytes num-bytes)) (+integer-typename-regex+ (symbol-name type)) (prog1 (if (string= type-signage "UINT") (octets->uint (subseq *decode-data* 0 num-bytes) num-bytes) (octets->int (subseq *decode-data* 0 num-bytes) num-bytes)) (advance num-bytes))))) (declare (inline advance)) (match type ((or :uint8-t :int8-t :uint16-t :int16-t :uint32-t :int32-t :uint64-t :int64-t) (decode-int type)) (:float (decode-float32 (decode-int :uint32-t))) (:double (decode-float64 (decode-int :uint64-t))) (:addr (prog1 (octets->uint (subseq *decode-data* 0 8) 8) (advance 8))) (:bool (prog1 (not (zerop (octets->uint (subseq *decode-data* 0 1) 1))) (advance 1))) (:uuid (prog1 (uuid-to-integer (subseq *decode-data* 0 16)) (advance 16))) (:offset (handler-bind ((error (lambda (e) (declare (ignorable e)) (let* ((offset (make-instance 'proto:offset)) (size (pb:octet-size offset))) (pb:merge-from-array offset *decode-data* 0 size) (prog1 offset (advance size)))))) (list (decode :uuid) (decode :uint64-t)))) (:string (let ((size (decode :uint64-t))) (prog1 (utf-8-bytes-to-string (subseq *decode-data* 0 size)) (advance size)))) ((list :mapping key-t value-t) (let ((result (make-hash-table :test #'equal))) (dotimes (n (decode :uint64-t) result) (declare (ignorable n)) (let* ((key (decode key-t)) (value (decode value-t))) (setf (gethash key result) value))))) ((list (or :sequence :set) type) (let (result) (reverse (dotimes (n (decode :uint64-t) result) (declare (ignorable n)) (push (decode type) result))))) ((list* :tuple types) (mapcar #'decode types)) ((list* :variant types) (let ((index (decode :uint64-t))) (cons index (decode (nth index types)))))))) (defun aux-data-decode (type data) (let ((*decode-data* data)) (decode type))) (defun encode (type data) (labels ((extend (it) (push it *decode-data*)) (encode-int (type data) (register-groups-bind (_ (#'parse-num-bytes 
num-bytes))
                 (+integer-typename-regex+ (symbol-name type))
               (declare (ignorable _))
               (extend (int->octets data num-bytes)))))
    (declare (inline extend))
    (match type
      ((or :uint8-t :int8-t :uint16-t :int16-t
           :uint32-t :int32-t :uint64-t :int64-t)
       (encode-int type data))
      (:float (encode-int :uint32-t (encode-float32 data)))
      (:double (encode-int :uint64-t (encode-float64 data)))
      (:addr (extend (int->octets data 8)))
      (:bool (extend (int->octets (if data 1 0) 1)))
      (:uuid (extend (integer-to-uuid data)))
      ;; An offset may arrive either as a raw protobuf message or as a
      ;; (uuid displacement) list; serialize accordingly.
      (:offset (etypecase data
                 (proto:offset
                  (let* ((size (pb:octet-size data))
                         (buffer (make-array size
                                             :element-type
                                             '(unsigned-byte 8))))
                    (pb:serialize data buffer 0 size)
                    (extend buffer)))
                 (list (progn (encode :uuid (first data))
                              (encode :uint64-t (second data))))))
      ;; Strings are length-prefixed UTF-8.
      (:string (let ((string-bytes (string-to-utf-8-bytes data)))
                 (encode :uint64-t (length string-bytes))
                 (extend string-bytes)))
      ((list :mapping key-t value-t)
       (encode :uint64-t (hash-table-count data))
       (maphash (lambda (key value)
                  (encode key-t key)
                  (encode value-t value))
                data))
      ((list (or :sequence :set) type)
       (let ((size (length data)))
         (encode :uint64-t size)
         (dotimes (n size)
           (encode type (elt data n)))))
      ((list* :tuple types)
       (mapc (lambda (type datum) (encode type datum)) types data))
      ((list* :variant types)
       (encode :uint64-t (car data))
       (encode (nth (car data) types) (cdr data))))))

(defun aux-data-encode (type data)
  "Encode DATA of aux-data TYPE into a flat byte vector."
  (let ((*decode-data* nil))
    (encode type data)
    (reduce {concatenate 'vector} (reverse *decode-data*))))



================================================
FILE: cl/package.lisp
================================================
;; BUG FIX: this previously read
;;   (defpackage :gtirb (use-package :common-lisp))
;; USE-PACKAGE is not a valid DEFPACKAGE option; options must be
;; keyword-headed lists such as (:use ...), as in cl/ranged.lisp below.
(defpackage :gtirb
  (:use :common-lisp))



================================================
FILE: cl/ranged.lisp
================================================
(defpackage :gtirb/ranged
  (:use :common-lisp)
  (:import-from :interval)
  (:export :make-ranged
           :ranged-insert
           :ranged-delete
           :ranged-find
           :ranged-find-at))
(in-package :gtirb/ranged)
#-debug (declaim (optimize (speed
3) (safety 0) (debug 0))) #+debug (declaim (optimize (speed 0) (safety 3) (debug 3))) (defun make-ranged () (interval:make-tree)) (defstruct (uuid-interval (:include interval:interval)) (uuid 0 :type integer)) (defun uuid-interval= (i1 i2) (= (uuid-interval-uuid i1) (uuid-interval-uuid i2))) (defun ranged-insert (tree uuid start end) (interval:insert tree (make-uuid-interval :uuid uuid :start start :end end))) (defun ranged-delete (tree uuid start end) (interval:delete tree (make-uuid-interval :uuid uuid :start start :end end))) (defun ranged-find-at (tree address) (mapcar #'uuid-interval-uuid (remove-if-not (lambda (i) (= address (interval:interval-start i))) (interval:find-all tree address)))) (defun ranged-find (tree start &optional (end start)) (mapcar #'uuid-interval-uuid (interval:find-all tree (cons start end)))) ================================================ FILE: cl/test.lisp ================================================ (defpackage :gtirb/test (:use :common-lisp :alexandria :flexi-streams :stefil :gtirb :gtirb/dot :gtirb/utility :gtirb/ranged :gtirb/version :graph :named-readtables :curry-compose-reader-macros) (:import-from :trivial-package-local-nicknames :add-package-local-nickname) (:import-from :gtirb.proto) (:import-from :gtirb/utility :check-magic-header :write-magic-header) (:import-from :md5 :md5sum-file :md5sum-sequence) (:import-from :uiop :nest :run-program :with-temporary-file :quit) (:import-from :asdf/system :system-relative-pathname) (:shadowing-import-from :gtirb :symbol) (:export :test :batch-test)) (in-package :gtirb/test) (in-readtable :curry-compose-reader-macros) (eval-when (:compile-toplevel :load-toplevel :execute) (add-package-local-nickname :proto :gtirb.proto)) (defvar *proto-path* nil "Path to protobuf.") (defun batch-test (&optional args) "Run tests in 'batch' mode printing results to STDERR then quit. The ERRNO used when exiting lisp indicates success or failure." 
(declare (ignorable args)) (let* ((stefil::*test-progress-print-right-margin* (expt 2 20)) (failures (coerce (stefil::failure-descriptions-of (without-debugging (test))) 'list))) (if failures (format *error-output* "FAILURES~%~{ ~a~~%~}" (mapc [#'stefil::name-of #'stefil::test-of #'car #'stefil::test-context-backtrace-of] failures)) (format *error-output* "SUCCESS~%")) (quit (if failures 2 0)))) (defvar *gtirb-dir* (system-relative-pathname "gtirb" "../")) ;;;; Fixtures. (defixture hello (:setup (progn #+live-w-ddisasm (with-temporary-file (:pathname bin-path) (setf *proto-path* (with-temporary-file (:pathname p :keep t) p)) (run-program (format nil "echo 'main(){puts(\"hello world\");}'~ |gcc -x c - -o ~a" bin-path) :force-shell t) (run-program (format nil "ddisasm --ir ~a ~a" *proto-path* bin-path))) #-live-w-ddisasm (setf *proto-path* (merge-pathnames "python/tests/hello.gtirb" *gtirb-dir*)))) (:teardown (progn #+live-w-ddisasm (delete-file *proto-path*) (setf *proto-path* nil)))) ;;;; Main test suite. (defsuite test) (in-suite test) (deftest we-have-versions () (is (stringp gtirb-version)) (is (integerp protobuf-version))) (deftest simple-read () (with-fixture hello (is (eql 'proto:ir (class-name (class-of (read-proto 'proto:ir *proto-path*))))))) (deftest simple-write () (with-fixture hello (with-temporary-file (:pathname path) (gtirb::write-proto (read-proto 'proto:ir *proto-path*) path) (is (probe-file path))))) (deftest idempotent-read-write () (with-fixture hello (with-temporary-file (:pathname path) (gtirb::write-proto (read-proto 'proto:ir *proto-path*) path) ;; Protobuf provides multiple options for serializing repeated ;; enums, so this check can fail even with valid serialization. 
#+inhibited (is (equalp (md5sum-file *proto-path*) (md5sum-file path)))))) (deftest read-gtirb-from-streams-and-files () (with-fixture hello (is (typep (read-gtirb *proto-path*) 'gtirb)) (is (typep (read-gtirb (namestring *proto-path*)) 'gtirb)) (is (typep (with-open-file (input *proto-path*) (read-gtirb input)) 'gtirb)))) (deftest idempotent-read-write-w-class () (nest (with-fixture hello) (with-temporary-file (:pathname path)) (let ((hello1 (read-gtirb *proto-path*))) (write-gtirb hello1 path) (is (is-equal-p hello1 (read-gtirb path)))))) (deftest idempotent-aux-data-type () (with-fixture hello (let ((it (read-gtirb *proto-path*))) (is (tree-equal (mapcar [#'pb:string-value #'proto:type-name #'gtirb::proto #'cdr] (aux-data (first (modules it)))) (mapcar [{format nil "~/gtirb::aux-data-type-print/"} #'aux-data-type #'cdr] (aux-data (first (modules it)))) :test #'string=))))) (deftest idempotent-aux-data-decode-encode () (let ((type1 '(:tuple :uuid :uint64-t :int64-t :uint64-t)) (type2 '(:sequence :uuid)) (type3 '(:sequence (:variant :uuid :string))) (data '(1 2 3 4)) (data2 '((0 . 1) (1 . "foo") (0 . 3) (1 . "bar")))) (is (equalp (gtirb::aux-data-decode type1 (gtirb::aux-data-encode type1 data)) data)) (is (equalp (gtirb::aux-data-decode type2 (gtirb::aux-data-encode type2 data)) data)) (is (equalp (gtirb::aux-data-decode type3 (gtirb::aux-data-encode type3 data2)) data2))) (with-fixture hello (let ((hello (read-gtirb *proto-path*))) (mapc (lambda (pair) (destructuring-bind (name . 
aux-data) pair (let* ((orig (proto:data (gtirb::proto aux-data))) (type (aux-data-type aux-data)) (new (gtirb::aux-data-encode type (aux-data-data aux-data)))) (is (equalp (gtirb::aux-data-decode type new) (gtirb::aux-data-decode type orig)) "~s with type ~a encodes/decodes is not idempotent~%~s" name (aux-data-type aux-data) (list (gtirb::aux-data-decode type orig) (gtirb::aux-data-decode type new)))))) (aux-data (first (modules hello))))))) (deftest test-check-magic-header () (is (signals gtirb-magic-error (check-magic-header #()))) (is (signals gtirb-magic-error (check-magic-header #(0 0 0 0 0 0 0 0)))) (is (signals gtirb-magic-error (check-magic-header #(71 84 73 82 66 0 0 0)))) (is (null (check-magic-header (vector 71 84 73 82 66 0 0 protobuf-version))))) (deftest test-write-magic-header () (with-output-to-sequence (out) (write-magic-header out) (is (equalp (get-output-stream-sequence out) (vector 71 84 73 82 66 0 0 protobuf-version))))) (deftest update-proto-to-disk-and-back () (nest (with-fixture hello) (with-temporary-file (:pathname path)) (let ((test-string "this is a test") (hello (read-gtirb *proto-path*)) (aux (make-instance 'aux-data))) (setf (aux-data-type aux) :string) (setf (aux-data-data aux) test-string) (push (cons "test" aux) (aux-data (first (modules hello)))) (write-gtirb hello path) (let* ((next (read-gtirb path)) (proto (gtirb::proto (first (modules next))))) ;; Test for non-empty protobuf elements. (is (not (zerop (length (proto:byte-intervals (aref (proto:sections proto) 0)))))) ;; Test for the aux-data table created earlier in the test. 
(is (string= (aux-data-data (cdr (assoc "test" (aux-data (first (modules next))) :test #'string=))) test-string)))))) (deftest create-module-with-a-name () (is (string= "foo" (nest (pb:string-value) (proto:name) (gtirb::proto) (make-instance 'module :name "foo" :allow-other-keys t))))) ;; FIXME: create-module-without-a-name should verify that the appropriate ;; warning is emitted, but for some reason the warning doesn't percolate up ;; to the point where the signals testing macro is able to catch it. (deftest create-module-without-a-name () (is (emptyp (nest (pb:string-value) (proto:name) (gtirb::proto) (make-instance 'module))))) (deftest entry-points-on-modules () (with-fixture hello (let* ((hello (read-gtirb *proto-path*)) (module (first (modules hello))) (code-block (nest (first) (remove-if-not {typep _ 'code-block}) (blocks hello)))) ;; Entry-point is read as a code block. (is (typep (entry-point module) 'code-block)) ;; Newly saved entry-point has the UUID of the code block. (setf (entry-point module) code-block) (is (= (uuid code-block) (uuid-to-integer (proto:entry-point (gtirb::proto module)))))))) (deftest back-pointers-work () (with-fixture hello (let ((hello (read-gtirb *proto-path*))) ;; Modules point to IR. (is (every [{eql hello} #'gtirb] (modules hello))) ;; Sections point to modules. (mapc (lambda (module) (is (every [{eql module} #'module] (sections module))) ;; Byte-intervals point to sections. (mapc (lambda (section) (is (every [{eql section} #'section] (byte-intervals section))) ;; Blocks point to byte-intervals. 
(mapc (lambda (byte-interval) (is (every [{eql byte-interval} #'byte-interval] (blocks byte-interval)))) (byte-intervals section))) (sections module))) (modules hello))))) (deftest access-block-bytes () (with-fixture hello (is (every [#'not #'null #'bytes] (blocks (read-gtirb *proto-path*)))))) (deftest find-every-block-in-the-module () (nest (with-fixture hello) (let ((it (read-gtirb *proto-path*)))) (is) (every {get-uuid _ it}) (mapcar #'uuid) (blocks it))) (deftest get-blocks-and-bytes-from-cfg-nodes () (nest (with-fixture hello) (let ((it (read-gtirb *proto-path*)))) (is) (every {get-uuid _ it}) (nodes) (cfg it))) (deftest shift-subseq-adds-and-removes-as-expected () (let ((it #(1 2 3 4 5))) (setf (gtirb::shift-subseq it 2 3) #(9 9 9 9)) (is (equalp it #(1 2 9 9 9 9 4 5)))) (let ((it #(1 2 3 4 5))) (setf (gtirb::shift-subseq it 2 3) #()) (is (equalp it #(1 2 4 5))))) (deftest set-block-bytes-to-the-same-size () (with-fixture hello (let* ((it (read-gtirb *proto-path*)) (original-byte-intervals (nest (mappend #'byte-intervals) (mappend #'sections) (modules it))) (original-byte-interval-md5sum (nest (md5sum-sequence) (force-byte-array) (apply #'concatenate 'vector) (mapcar #'contents original-byte-intervals)))) (let ((target (first (mappend #'blocks original-byte-intervals)))) (setf (bytes target) (make-array (length (bytes target)) :initial-element 9)) (is (= (length original-byte-intervals) ; No new byte intervals. (length (nest (mappend #'byte-intervals) (mappend #'sections) (modules it))))) (is (not (equalp original-byte-interval-md5sum ; New contents. 
(nest (md5sum-sequence) (force-byte-array) (apply #'concatenate 'vector) (mapcar #'contents) (mappend #'byte-intervals) (mappend #'sections) (modules it))))))))) (deftest set-block-bytes-to-the-different-size () (with-fixture hello (let* ((it (read-gtirb *proto-path*)) (original-byte-intervals (nest (mappend #'byte-intervals) (mappend #'sections) (modules it))) (target (first (mappend #'blocks original-byte-intervals))) (original-bi-size (size (byte-interval target))) (original-bi-bytes (bytes (byte-interval target))) (original-size (length (bytes target))) (rest-block-bytes (cdr (mapcar #'bytes (blocks (byte-interval target)))))) (setf (bytes target) (make-array (* 2 original-size) :initial-element 9)) ;; First block bytes are updated. (is (equalp (bytes (first (mappend #'blocks original-byte-intervals))) (make-array (* 2 original-size) :initial-element 9))) ;; Block size is updated. (is (equalp (size target) (* 2 original-size))) ;; Byte-interval size is updated. (is (equalp (size (byte-interval target)) (+ original-bi-size original-size))) ;; Remainder of the byte-interval's bytes are the same. (is (equalp (subseq (bytes (byte-interval target)) (* 2 original-size)) (subseq original-bi-bytes original-size))) ;; Remaining blocks bytes are the same. (is (every #'equalp rest-block-bytes (cdr (mapcar #'bytes (blocks (byte-interval target))))))))) (deftest address-range-block-lookup () (with-fixture hello (let* ((it (read-gtirb *proto-path*)) (a-block (first (blocks it)))) (is (= 2 (length (address-range a-block)))) (is (member a-block (nest (mappend #'blocks) (on-address it) (first) (address-range a-block)))) (is (member a-block (nest (mappend #'blocks) (at-address it) (first) (address-range a-block)))) (is (not (member a-block (nest (mappend #'blocks) (at-address it) (second) (address-range a-block)))))))) (deftest symbolic-expressions-pushed-back () (with-fixture hello ;; Collect a byte-interval with offset symbolic expressions. 
(let* ((bi (nest (find-if [{some [#'not #'zerop #'car]} #'hash-table-alist #'symbolic-expressions]) (cdr) (mappend #'byte-intervals) (sections) (first) (modules) (read-gtirb *proto-path*))) (original-length (length (bytes bi))) (original-offsets (hash-table-keys (symbolic-expressions bi))) (largest-offset (extremum original-offsets #'>)) (smallest-offset (extremum original-offsets #'<))) ;; Add bytes after the last symbol. (setf (bytes bi largest-offset largest-offset) (make-array 2 :initial-element 9)) ;; Ensure bytes have been altered. (is (> (length (bytes bi)) original-length)) ;; Ensure symbolic expressions before last have not moved. (is (set-equal (remove (+ largest-offset 2) (hash-table-keys (symbolic-expressions bi))) (remove largest-offset original-offsets))) ;; Remove those added bytes (setf (bytes bi largest-offset (+ largest-offset 2)) #()) ;; Add bytes at the beginning. (setf (bytes bi 0 0) (make-array 1 :initial-element 9)) ;; Ensure symbolic expressions have actually been pushed back. (is (set-equal (mapcar #'1+ original-offsets) (hash-table-keys (symbolic-expressions bi)))) ;; Drop bytes at the beginning. (setf (bytes bi 0 (1+ smallest-offset)) #()) ;; Ensure this symbolic expression now starts at the beginning. 
(is (zerop (extremum (hash-table-keys (symbolic-expressions bi)) #'<)))))) (defvar *listing-comments*) (defun get-listing-comments (it) (when-let ((table (assoc "comments" (gtirb::aux-data-w-offsets (ir it)) :test #'equalp))) (hash-table-alist (aux-data-data (cdr table))))) (defmethod listing :around (object &key stream comments) (declare (ignorable stream comments)) (let ((*listing-comments* (if (boundp '*listing-comments*) *listing-comments* (get-listing-comments object)))) (call-next-method))) (defgeneric listing (OBJECT &key stream comments) (:documentation "Print a listing of OBJECT.") (:method ((self gtirb) &key (stream t) comments) (format stream "~&IR~%") (mapc {listing _ :stream stream :comments comments} (modules self))) (:method ((self module) &key (stream t) comments) (format stream "~&Module: ~S~%" (name self)) (mapc {listing _ :stream stream :comments comments} (sections self))) (:method ((self section) &key (stream t) comments) (format stream "~&Section: ~S" (name self)) (mapc {listing _ :stream stream :comments comments} (byte-intervals self))) (:method ((self byte-interval) &key (stream t) comments) (format stream "~:[ (no address)~; at ~a~]~%" (addressp self) (address self)) (mapc {listing _ :stream stream :comments comments} (blocks self))) (:method ((self gtirb-byte-block) &key (stream t) comments) (let ((bytes (bytes self)) (comments (when comments (remove-if-not [{= (uuid self)} #'caar] *listing-comments*)))) (dotimes (step (size self)) (format stream (if (zerop step) "~&>" " ")) (if-let ((comment (and comments (find-if [{= step} #'cadar] comments)))) (format stream "~4X ; ~A~%" (aref bytes step) (cdr comment)) (format stream "~4X" (aref bytes step))) (when (= 7 (mod step 8)) (format stream "~&")))))) (defun block-comments (data-block it) (sort (nest (remove-if-not [{= (uuid data-block)} #'caar]) (hash-table-alist) (aux-data-data) (cdr) (assoc "comments" (gtirb::aux-data-w-offsets (ir it)) :test #'equalp)) #'< :key [#'second #'car])) (deftest 
offsets-pushed-back () (nest (let ((gtirb::*update-aux-data-offsets* t))) (with-fixture hello) (let* ((it (read-gtirb *proto-path*)) (text (find-if [{string= ".text"} #'name] (sections (first (modules it))))) (commented-block (find-if {block-comments _ it} (blocks text))) (comment (first (block-comments commented-block it))) (starting-offset (cadar comment))) (is (gtirb::get-aux-data-w-offsets it) "We're finding aux-data tables with offsets. ~ Should be at least comments and cfiDirectives.") (is (gtirb::aux-data-w-offsets it) "The `aux-data-w-offsets' was populated.") #+nil (listing commented-block :comments t) (setf (bytes commented-block 0 0) #(0 0 0 0)) #+nil (listing commented-block :comments t) (is (= (+ 4 starting-offset) (cadar (first (block-comments commented-block it)))))))) (deftest block-symbolic-expressions () (with-fixture hello (is (nest (mappend [#'hash-table-values #'symbolic-expressions]) (mappend #'blocks) (mappend #'byte-intervals) (sections) (first) (modules) (read-gtirb *proto-path*))))) (deftest symbolic-expressions-maintained () (nest (with-fixture hello) (mapc (lambda (db) (let ((o-offset (offset db)) (o-bi-size (size (byte-interval db))) (o-db-size (size db)) (o-bi-se-size (hash-table-size (symbolic-expressions (byte-interval db)))) (o-se-size (hash-table-size (symbolic-expressions db)))) (setf (bytes db 0 0) #(#x90 #x90 #x90 #x90)) (is (= o-offset (offset db))) (is (= (+ 4 o-bi-size) (size (byte-interval db)))) (is (= (+ 4 o-db-size) (size db))) (is (= o-bi-se-size (hash-table-size (symbolic-expressions (byte-interval db))))) (is (= o-se-size (hash-table-size (symbolic-expressions db))))))) (blocks (read-gtirb *proto-path*)))) (deftest payload-can-be-read-and-set () (with-fixture hello (let* ((it (read-gtirb *proto-path*)) (symbols (mappend #'symbols (modules it))) (referent-symbol (find-if [#'proto:has-referent-uuid #'gtirb::proto] symbols))) ;; Reading gives the right type of payload. 
(is (subtypep (type-of (payload referent-symbol)) 'gtirb::proto-backed)) ;; Setting a payload has the right effect. (setf (payload referent-symbol) 42) ; Referent to value. (is (subtypep (type-of (payload referent-symbol)) 'number)) (is (not (proto:has-referent-uuid (gtirb::proto referent-symbol))))))) (deftest can-create-without-parents () (is (typep (make-instance 'module) 'module)) (is (typep (make-instance 'section) 'section)) (is (typep (make-instance 'byte-interval) 'byte-interval))) (deftest direct-ir-access () (with-fixture hello (let* ((it (read-gtirb *proto-path*))) (is (typep (ir (setf it (first (modules it)))) 'gtirb)) (is (typep (ir (setf it (first (sections it)))) 'gtirb)) (is (typep (ir (setf it (first (byte-intervals it)))) 'gtirb)) (is (typep (ir (setf it (first (blocks it)))) 'gtirb))))) (deftest every-symbolic-expression-has-symbols () (flet ((every-symbolic-expression-has-symbols-proto (path) (every (lambda (se) (cond ((proto:has-addr-const se) (proto:symbol-uuid (proto:addr-const se))) ((proto:has-addr-addr se) (proto:symbol1-uuid (proto:addr-addr se))))) (nest (mapcar #'proto:value) (mappend [{coerce _ 'list} #'proto:symbolic-expressions]) (mappend [{coerce _ 'list} #'proto:byte-intervals]) (coerce (proto:sections (aref (proto:modules (read-proto 'proto:ir path)) 0)) 'list)))) (every-symbolic-expression-has-symbols-gtirb (path) (nest (every #'symbols) (mappend [#'hash-table-values #'symbolic-expressions]) (mappend #'byte-intervals) (mappend #'sections) (modules (read-gtirb path))))) (with-fixture hello ;; First confirm for the protobuf (is (every-symbolic-expression-has-symbols-proto *proto-path*)) ;; Second confirm for the GTIRB representation. (is (every-symbolic-expression-has-symbols-gtirb *proto-path*)) ;; Then re-confirm both for a rewritten protobuf file. 
(uiop:with-temporary-file (:pathname temporary-file) (write-gtirb (read-gtirb *proto-path*) temporary-file) (is (every-symbolic-expression-has-symbols-proto temporary-file)) (is (every-symbolic-expression-has-symbols-gtirb temporary-file)))))) #+ignore-expected-failure (deftest every-block-is-found-at-its-address () (with-fixture hello (let ((it (read-gtirb *proto-path*))) (nest (is) (every «member #'identity [{at-address it} #'address]») (mappend #'blocks) (mappend #'byte-intervals) (mappend #'sections) (modules it))))) (deftest truncating-size-on-byte-interval-errors-and-truncates () (with-fixture hello (let ((byte-intervals (nest (mappend #'byte-intervals) (mappend #'sections) (modules) (read-gtirb *proto-path*)))) ;; Truncation signals an error. (signals ir (setf (size (first byte-intervals)) (1- (length (contents (first byte-intervals)))))) ;; Truncate restart works. (let* ((bi (second byte-intervals)) (original-length (length (contents bi)))) (handler-bind ((ir (lambda (e) (if (find-restart 'truncate-contents) (invoke-restart 'truncate-contents) (error e))))) (setf (size bi) (1- original-length))) (is (= original-length (+ 1 (size bi)) (+ 1 (length (contents bi)))))) ;; Ignore restart works. 
(let* ((bi (third byte-intervals)) (original-length (length (contents bi)))) (handler-bind ((ir (lambda (e) (if (find-restart 'ignore) (invoke-restart 'ignore) (error e))))) (setf (size bi) (1- original-length))) (is (= original-length (length (contents bi)))) (is (> original-length (size bi))))))) ;;;; Dot test suite (deftest write-dot-to-file () (with-fixture hello (with-temporary-file (:pathname path) (to-dot-file (read-gtirb *proto-path*) path)))) ================================================ FILE: cl/update.lisp ================================================ (defpackage :gtirb/update (:use :common-lisp :alexandria :gtirb/utility :named-readtables :curry-compose-reader-macros :command-line-arguments) (:import-from :serapeum :take-while) (:import-from :gtirb.proto) (:import-from :trivial-package-local-nicknames :add-package-local-nickname) (:import-from :proto-v0) (:import-from :uiop :nest) (:import-from :uiop/image :quit) (:import-from :gtirb :aux-data :aux-data-type :aux-data-data :+module-file-format-map+) (:export :update :upgrade :read-proto :write-proto)) (in-package :gtirb/update) (in-readtable :curry-compose-reader-macros) (eval-when (:compile-toplevel :load-toplevel :execute) (add-package-local-nickname :proto :gtirb.proto) (defparameter +udpate-args+ '((("help" #\h #\?) 
:type boolean :optional t :documentation "display help output")))) (defun module-bytes-subseq (module start end &aux (results #())) (let ((regions (proto-v0:regions (proto-v0:byte-map (proto-v0:image-byte-map module))))) (force-byte-array (dotimes (n (length regions) results) (let* ((region (aref regions n)) (address (proto-v0:address region)) (size (length (proto-v0:data region)))) (cond ((and (<= address start) (< start (+ address size))) (setf results (concatenate 'vector results (subseq (proto-v0:data region) (- start address) (min size (- end address))))) (setf start (min end (+ address size)))) ((= start end) (return results)))))))) (defun byte-interval (module section &aux (new (make-instance 'proto:byte-interval))) (let ((address (proto-v0:address section)) (size (proto-v0:size section))) (setf (proto:uuid new) (new-uuid) (proto:address new) address (proto:has-address new) (proto-v0:has-address section) (proto:size new) size (proto:contents new) (module-bytes-subseq module address (+ address size)) (proto:symbolic-expressions new) (map 'vector {upgrade _ :base address} (remove-if-not [«and {<= address} {>= (+ address size)}» #'proto-v0:key] (proto-v0:symbolic-operands module))) (proto:blocks new) (map 'vector (lambda (block) (etypecase block (proto-v0:block (let ((it (make-instance 'proto:block))) (setf (proto:code it) (upgrade block) (proto:offset it) (- (proto-v0:address block) address)) it)) (proto-v0:data-object (let ((it (make-instance 'proto:block))) (setf (proto:data it) (upgrade block :base address) (proto:offset it) (- (proto-v0:address block) address)) it)))) (remove-if-not (lambda (block) (let ((addr (proto-v0:address block))) (and (<= address addr) (< addr (+ address size))))) (concatenate 'vector (proto-v0:blocks module) (proto-v0:data module)))))) (coerce (list new) 'vector)) (defun entry-point (module) (when-let ((address (proto-v0:entry-point-address (proto-v0:image-byte-map module)))) (if-let ((gtirb-block (find-if «and [{< address} «+ 
#'proto-v0:address #'proto-v0:size»] [{>= address} #'proto-v0:address]» (proto-v0:blocks module)))) (proto-v0:uuid gtirb-block) (if (zerop address) (warn "Zero address found in module ~S, assuming not an entry point." (pb:string-value (proto-v0:name module))) (error "No block found holding module ~S entry point ~a." (pb:string-value (proto-v0:name module)) address))))) (defmacro transfer-fields (new old &rest fields) `(progn ,@(mapcar (lambda (field) `(setf (,(intern (symbol-name field) 'proto) ,new) (upgrade (,(intern (symbol-name field) 'proto-v0) ,old)))) fields))) #+debug (defun serial (it) "Useful to ensure yourself of what protobuf serialization is producing." (let* ((size (pb:octet-size it)) (buffer (make-array size :element-type '(unsigned-byte 8)))) (pb:serialize it buffer 0 size) buffer)) #+debug (defun deserial (class bytes &aux (it (make-instance class))) "Useful to ensure yourself of what protobuf deserialization is producing." (pb:merge-from-array it bytes 0 (length bytes)) it) (defun combine-cfgs (cfgs) (let ((it (make-instance 'proto:cfg))) (setf (proto:edges it) (coerce (mappend [{coerce _ 'list} #'proto:edges] cfgs) 'vector)) (setf (proto:vertices it) (coerce (mappend [{coerce _ 'list} #'proto:vertices] cfgs) 'vector)) it)) (define-constant +symbol-storage-kind+ '((#.proto-v0:+storage-kind-storage-undefined+ . :undefined) (#.proto-v0:+storage-kind-storage-normal+ . :normal) (#.proto-v0:+storage-kind-storage-static+ . :static) (#.proto-v0:+storage-kind-storage-extern+ . :extern) (#.proto-v0:+storage-kind-storage-local+ . :local)) :test #'equal) (defvar *code-block-uuids* (make-hash-table)) (defvar *data-block-uuids* (make-hash-table)) (defun storage-kind (symbol) (cdr (assoc (proto-v0:storage-kind symbol) +symbol-storage-kind+))) (defun elf-symbol-info (symbol) "Return an elfSymbolInfo entry for SYMBOL using its `proto-v0:storage-kind'." (list 0 ;; Point to data "OBJ," if it points to a code "FUNC," else "NOTYPE." 
(cond ((gethash (proto-v0:uuid symbol) *data-block-uuids*) "OBJ") ((gethash (proto-v0:uuid symbol) *code-block-uuids*) "FUNC") (t "NOTYPE")) (ecase (storage-kind symbol) ((:normal :static) "GLOBAL") (:local "LOCAL")) (ecase (storage-kind symbol) (:normal "DEFAULT") ((:local :static) "HIDDEN")) 0)) (defun update-padding-table (data offset-bases) "Convert DATA which is keyed by addresses to be keyed by offset. Use OFFSET-BASES, an alist of base address and byte-interval, to do this conversion." (let* ((it (make-instance 'aux-data :proto data)) (data (aux-data-data it))) (nest (setf (aux-data-type it) '(:mapping :offset :uint64-t) (aux-data-data it)) (alist-hash-table) (mapcar (lambda (pair) (destructuring-bind (addr . value) pair (let ((base (nest (lastcar) (take-while [{> addr} #'car]) offset-bases))) (destructuring-bind (base . id) base (cons (let ((it (make-instance 'proto:offset))) (setf (proto:element-id it) id) (setf (proto:displacement it) (- addr base)) it) value)))))) (hash-table-alist) data) (gtirb::proto it))) (defun offset-bases (new-sections) (nest (apply #'append) (map 'list (lambda (section) (map 'list (lambda (bi) (assert (proto:has-address bi)) (cons (proto:address bi) (proto:uuid bi))) (proto:byte-intervals section)))) new-sections)) (defgeneric upgrade (object &key &allow-other-keys) (:documentation "Upgrade OBJECT to the next protobuf version.") (:method ((old t) &key &allow-other-keys) old) (:method ((old array) &key &allow-other-keys) (if (every #'numberp old) (force-byte-array old) (map 'vector #'upgrade old))) (:method ((old proto-v0:ir) &key &allow-other-keys &aux (new (make-instance 'proto:ir))) (setf (proto:uuid new) (proto-v0:uuid old) (proto:version new) 1 (proto:aux-data new) (upgrade (proto-v0:aux-data-container old) :new-class 'proto:ir-aux-data-entry) (proto:modules new) (upgrade (proto-v0:modules old)) (proto:cfg new) (combine-cfgs (map 'list [#'upgrade #'proto-v0:cfg] (proto-v0:modules old)))) new) (:method ((old proto-v0:module) 
&key &allow-other-keys &aux (new (make-instance 'proto:module))) (transfer-fields new old uuid binary-path preferred-addr rebase-delta file-format name symbols proxies name) (let ((new-sections (map 'vector {upgrade _ :module old} (proto-v0:sections old)))) (setf (proto:isa new) (proto-v0:isa-id old) (proto:aux-data new) (upgrade (proto-v0:aux-data-container old) :new-class 'proto:module-aux-data-entry :offset-bases (offset-bases new-sections)) (proto:sections new) new-sections)) (if-let ((entry-point (entry-point old))) (setf (proto:entry-point new) entry-point)) ;; Add a symbolType AuxData table of type mapping to ;; track the storage kinds of all symbols. (ecase (cdr (assoc (proto-v0:file-format old) +module-file-format-map+)) (:elf (let ((ad (make-instance 'aux-data)) (ade (make-instance 'proto:module-aux-data-entry))) (setf (aux-data-type ad) '(:mapping :uuid (:tuple :uint64-t :string :string :string :uint64-t)) (aux-data-data ad) (alist-hash-table (map 'list «cons [#'uuid-to-integer #'proto-v0:uuid] #'elf-symbol-info» (remove-if [{eql :extern} #'storage-kind] (proto-v0:symbols old))))) (setf (proto:key ade) (pb:string-field "elfSymbolInfo") (proto:value ade) (gtirb::proto ad)) (setf (proto:aux-data new) (coerce (append (list ade) (coerce (proto:aux-data new) 'list)) 'vector)))) (:pe (flet ((symbols-to-aux-data (name symbols) (let ((ad (make-instance 'aux-data)) (ade (make-instance 'proto:module-aux-data-entry))) (setf (aux-data-type ad) '(:set :uuid) (aux-data-data ad) symbols (proto:key ade) (pb:string-field name) (proto:value ade) (gtirb::proto ad)) ade))) (let ((in (symbols-to-aux-data "peImportedSymbols" (nest (mapcar [#'uuid-to-integer #'proto-v0:uuid]) (remove-if-not [{member _ '(:local :static)} #'storage-kind]) (proto-v0:symbols old)))) (out (symbols-to-aux-data "peExportedSymbols" (nest (mapcar [#'uuid-to-integer #'proto-v0:uuid]) (remove-if-not [{member _ '(:normal :extern)} #'storage-kind]) (proto-v0:symbols old))))) (setf (proto:aux-data new) 
(coerce (append (list in out) (coerce (proto:aux-data new) 'list)) 'vector)))))) new) (:method ((old proto-v0:aux-data-container) &key new-class offset-bases &allow-other-keys) (map 'vector (lambda (entry) (let ((it (make-instance new-class))) (let ((new-value (upgrade (proto-v0:value entry)))) (when (string= "padding" (pb:string-value (proto-v0:key entry))) (setf new-value (update-padding-table new-value offset-bases))) (setf (proto:key it) (proto-v0:key entry) (proto:value it) new-value)) it)) (proto-v0:aux-data old))) (:method ((old proto-v0:aux-data) &key &allow-other-keys &aux (new (make-instance 'proto:aux-data))) (transfer-fields new old type-name data) new) (:method ((old proto-v0:section) &key module &allow-other-keys &aux (new (make-instance 'proto:section))) (transfer-fields new old uuid name) (setf (proto:byte-intervals new) (byte-interval module old)) new) (:method ((old proto-v0:edge-label) &key &allow-other-keys &aux (new (make-instance 'proto:edge-label))) (transfer-fields new old conditional direct type) new) (:method ((old proto-v0:edge) &key &allow-other-keys &aux (new (make-instance 'proto:edge))) (transfer-fields new old source-uuid target-uuid label) new) (:method ((old proto-v0:cfg) &key &allow-other-keys &aux (new (make-instance 'proto:cfg))) (transfer-fields new old vertices edges) new) (:method ((old proto-v0:module-symbolic-operands-entry) &key base &allow-other-keys &aux (new (make-instance 'proto:byte-interval-symbolic-expressions-entry))) (setf (proto:key new) (- (proto-v0:key old) base) (proto:value new) (upgrade (proto-v0:value old))) new) (:method ((old proto-v0:symbol) &key &allow-other-keys &aux (new (make-instance 'proto:symbol))) (transfer-fields new old uuid name) (cond ; Variant "oneof" 'value' or 'referent_uuid'. 
((proto-v0:has-value old) (setf (proto:value new) (proto-v0:value old))) ((proto-v0:has-referent-uuid old) (setf (proto:referent-uuid new) (upgrade (proto-v0:referent-uuid old)) ;; This field was added after GTIRB-V.0. (proto:at-end new) nil))) new) (:method ((old proto-v0:symbolic-expression) &key &allow-other-keys &aux (new (make-instance 'proto:symbolic-expression))) (cond ; Variant "oneof" field. ((proto-v0:has-addr-const old) (setf (proto:addr-const new) (upgrade (proto-v0:addr-const old)))) ((proto-v0:has-addr-addr old) (setf (proto:addr-addr new) (upgrade (proto-v0:addr-addr old)))) (t (warn "Symbolic expressions ~s has no value." old))) #+debug (progn ; Potentially useful debug pattern to inspect protobuf. (format t "~%~%~%OLD:~S~%" (serial old)) (describe old) (format t "~%NEW:~S~%" (serial new)) (describe new)) new) (:method ((old proto-v0:sym-addr-const) &key &allow-other-keys &aux (new (make-instance 'proto:sym-addr-const))) (transfer-fields new old symbol-uuid) new) (:method ((old proto-v0:sym-addr-addr) &key &allow-other-keys &aux (new (make-instance 'proto:sym-addr-addr))) (transfer-fields new old scale offset symbol1-uuid symbol2-uuid) new) (:method ((old proto-v0:block) &key &allow-other-keys &aux (new (make-instance 'proto:code-block))) (setf (gethash (proto-v0:uuid old) *code-block-uuids*) t) (transfer-fields new old uuid size decode-mode) new) (:method ((old proto-v0:data-object) &key &allow-other-keys &aux (new (make-instance 'proto:data-block))) (setf (gethash (proto-v0:uuid old) *data-block-uuids*) t) (transfer-fields new old uuid size) new)) (define-command update (input-file output-file &spec +udpate-args+) "Update GTIRB protobuf from INPUT-FILE to OUTPUT-FILE." 
""
  (when help (show-help-for-update) (quit))
  ;; Seed the PRNG so the UUIDs minted during the upgrade (see
  ;; `new-uuid') differ from run to run.
  (setf *random-state* (make-random-state t))
  (write-proto (upgrade (read-proto 'proto-v0:ir input-file)) output-file))

================================================ FILE: cl/utility.lisp ================================================

(defpackage :gtirb/utility
  (:use :common-lisp :gtirb/version)
  (:import-from :cl-intbytes :int->octets :octets->int)
  (:import-from :alexandria
                :define-constant
                :read-stream-content-into-byte-vector
                :read-file-into-byte-vector
                :starts-with-subseq)
  (:import-from :uiop :nest)
  (:import-from :uiop/stream :file-stream-p)
  (:export :read-proto :write-proto :gtirb-magic-error :new-uuid
           :force-byte-array :uuid-to-integer :integer-to-uuid))
(in-package :gtirb/utility)
(declaim (optimize (speed 3) (safety 0) (debug 0)))

(define-constant gtirb-magic-octets #(71 84 73 82 66) ;; "GTIRB"
  :test #'equalp
  :documentation "GTIRB file magic bytes at beginning of magic header.")

(define-constant gtirb-magic-length 8
  :test #'equal
  :documentation "Number of bytes in the GTIRB file magic header.")

(define-condition gtirb-magic-error (error)
  ((message :initarg :message :initform nil :reader message))
  (:report (lambda (condition stream) (format stream "~S" (message condition))))
  (:documentation "Condition raised if GTIRB header is invalid."))

(defgeneric read-proto (class source)
  (:documentation "Read protobuf object of class CLASS from SOURCE.")
  ;; Fail early with a useful message when handed a non-existent path.
  (:method :before (class (path pathname))
    (declare (ignorable class))
    (assert (probe-file path) (path)
            "Can't read Protobuf from ~s, because the file doesn't exist."
            path))
  (:method (class (path string)) (read-proto class (pathname path)))
  (:method (class (path pathname))
    ;; NOTE(review): use an explicit octet element type; a bare
    ;; `unsigned-byte' leaves the byte size implementation-chosen,
    ;; while the byte-vector readers below expect (unsigned-byte 8).
    (with-open-file (input path :direction :input
                           :element-type '(unsigned-byte 8))
      (read-proto class input)))
  (:method (class (input stream))
    (read-proto class (if (file-stream-p input)
                          (read-file-into-byte-vector input)
                          (read-stream-content-into-byte-vector input))))
  (:method (class (buffer array) &aux (gtirb (make-instance class)))
    ;; Validate the magic header, then deserialize the remainder.
    (check-magic-header buffer)
    (pb:merge-from-array gtirb buffer gtirb-magic-length (length buffer))
    gtirb))

(defun write-proto (object path)
  "Write protobuf OBJECT to PATH, prefixed by the GTIRB magic header."
  (let* ((size (pb:octet-size object))
         (buffer (make-array size :element-type '(unsigned-byte 8))))
    (pb:serialize object buffer 0 size)
    (with-open-file (output path :direction :output :if-exists :supersede
                            :element-type '(unsigned-byte 8))
      (write-magic-header output)
      (write-sequence buffer output)))
  (values))

(defun new-uuid (&aux (it (make-array 16 :element-type '(unsigned-byte 8))))
  "Return a new random UUID."
  (dotimes (n 16 it) (setf (aref it n) (random 256))))

(defun force-byte-array (array)
  "Force ARRAY into a byte array."
  (declare (type (simple-array) array))
  (make-array (length array) :element-type '(unsigned-byte 8)
              :initial-contents array))

(defun uuid-to-integer (uuid)
  (declare (type (simple-array) uuid))
  ;; Tolerate empty UUIDs by mapping them to zero.
  (if (zerop (length uuid))
      (prog1 0 #+debug (warn "Bad null UUID."))
      (octets->int (force-byte-array uuid) 16)))

(defun integer-to-uuid (number) (int->octets number 16))

(defun check-magic-header (bytes)
  "Check that the GTIRB magic header bytes are present at the start of
BYTES, throwing a GTIRB-MAGIC-ERROR if the header is not present."
(when (or (< (length bytes) gtirb-magic-length) (not (starts-with-subseq gtirb-magic-octets bytes))) (error (make-condition 'gtirb-magic-error :message "File missing GTIRB magic - not a GTIRB file?"))) (when (not (equal protobuf-version (aref bytes (1- gtirb-magic-length)))) (error (nest (make-condition 'gtirb-magic-error :message) (format nil "Attempt to decode IR of version ~d (expected version ~d)" (aref bytes (1- gtirb-magic-length)) protobuf-version))))) (defun write-magic-header (stream) "Write the GTIRB magic header bytes to STREAM." (write-sequence gtirb-magic-octets stream) (write-byte 0 stream) (write-byte 0 stream) (write-byte protobuf-version stream)) ================================================ FILE: cl/validate.lisp ================================================ (defpackage :gtirb/validate (:use :gt/full :gtirb :graph :command-line-arguments) (:import-from :gtirb.proto) (:shadowing-import-from :gt/full :size :copy) (:shadowing-import-from :gtirb :symbol) (:export :validate)) (in-package :gtirb/validate) (in-readtable :curry-compose-reader-macros) (defmethod size ((gtirb-node gtirb-node)) (gtirb:size gtirb-node)) (defmethod copy ((graph graph) &key &allow-other-keys) (graph:copy graph)) ;;;; Interface (defvar *requirements* nil "A-list of default requirements keyed by object type.") (defvar *failed-checks*) (defgeneric validate (object &key requirements) (:documentation "Validate that OBJECT satisfies the requirements in .") (:method ((object t) &key (requirements *requirements*) &aux (*failed-checks* nil)) (values (every {check object} (cdr (assoc (type-of object) requirements))) *failed-checks*))) (defclass check () ((action :reader action :initarg :action :type (or symbol function) :documentation "Action to run the check.") (object :reader object :initarg :object :type symbol :documentation "Type of object the check applies to.") (name :reader name :initarg :name :type string :documentation "Name of the check.")) (:documentation "Check objects 
hold validation checks for gtirb instances.")) (defmethod initialize-instance :after ((check check) &key (requirements *requirements*) &allow-other-keys) (unless (assoc (object check) requirements) (push (list (object check)) requirements)) (pushnew check (cdr (assoc (object check) requirements)) :key #'name)) (defgeneric check (object requirement) (:documentation "Check that OBJECT satisfies REQUIREMENT.") (:method ((obj t) (requirement symbol)) (funcall requirement obj)) (:method ((obj t) (requirement function)) (funcall requirement obj)) (:method ((obj t) (requirement check)) (funcall (action requirement) obj))) (defmethod check :around ((object t) (requirement function)) (or (call-next-method) (push requirement *failed-checks*))) (defmethod check :around ((object t) (requirement check)) (or (call-next-method) (push (name requirement) *failed-checks*))) ;;;; GTIRB Checks (defmacro define-check-generic (name (object) &body methods) `(progn (defgeneric ,name (,object) ,@methods) (make-instance 'check :name ',name :action ',name :object ',(second (first (second (first methods))))))) (define-check-generic size-matches-contents (object) (:method ((obj gtirb)) (every #'size-matches-contents (modules obj))) (:method ((obj module)) (every #'size-matches-contents (sections obj))) (:method ((obj section)) (every #'size-matches-contents (byte-intervals obj))) (:method ((obj byte-interval)) (= (size obj) (length (contents obj))))) (flet ((nothing-overlaps- (things &aux (min 0)) (and (every (lambda (pair) (destructuring-bind (address . 
size) pair (prog1 (>= address min) (setf min (max min (+ address size)))))) (sort (mapcar «cons #'address #'size» things) #'< :key #'car)) (every #'nothing-overlaps things)))) (define-check-generic nothing-overlaps (object) (:method ((obj gtirb)) (every #'nothing-overlaps (modules obj))) (:method ((obj module)) (nothing-overlaps- (sections obj))) (:method ((obj section)) (nothing-overlaps- (byte-intervals obj))) (:method ((obj byte-interval)) (nothing-overlaps- (remove-if-not {typep _ 'code-block} (blocks obj)))) (:method ((obj code-block)) t))) (define-check-generic all-referents-exist (object) (:method ((obj gtirb)) (and (every #'all-referents-exist (modules obj)) (every {get-uuid _ obj} (nodes (cfg obj))))) (:method ((obj module)) (every #'all-referents-exist (symbols obj))) (:method ((obj symbol)) (if (gtirb.proto:has-referent-uuid (gtirb::proto obj)) (payload obj) t))) (define-check-generic symbolic-expression-size-well-formed (object) (:method ((obj gtirb)) (every [{every «member #'second [#'hash-table-keys #'symbolic-expressions {get-uuid _ obj} #'car]»} #'hash-table-keys #'aux-data-data #'cdr (lambda (el) (assoc "symbolicExpressionSizes" el :test #'string=)) #'aux-data] (modules obj)))) ;;;; Command-line interface (eval-when (:compile-toplevel :load-toplevel :execute) (defparameter +validate-args+ '((("help" #\h #\?) :type boolean :optional t :documentation "display help output")))) (define-command validate-file (gtirb-file &spec +validate-args+) "Validate GTIRB-FILE." 
"" (flet ((exit (code) (if *lisp-interaction* (return-from validate-file (zerop code)) (quit code)))) (when help (show-help-for-validate-file) (quit)) (if (validate (read-gtirb gtirb-file)) (exit 0) (exit 2)))) ================================================ FILE: cl/version.lisp ================================================ (defpackage :gtirb/version (:use :common-lisp) (:import-from :alexandria :define-constant) (:import-from :asdf/system :system-relative-pathname) (:import-from :uiop :nest) (:export :gtirb-version :protobuf-version)) (in-package :gtirb/version) (eval-when (:compile-toplevel :load-toplevel :execute) (defvar version.txt `#.(nest (let ((version-path (system-relative-pathname "gtirb" "../version.txt")))) (with-open-file (in version-path)) (loop for line = (read-line in nil :eof) until (eql line :eof) collect (let ((delim (position #\Space line))) (cons (intern (subseq line 0 delim)) (parse-integer (subseq line (1+ delim))))))))) (define-constant gtirb-version (format nil "~d.~d.~d" (cdr (assoc 'VERSION_MAJOR version.txt)) (cdr (assoc 'VERSION_MINOR version.txt)) (cdr (assoc 'VERSION_PATCH version.txt))) :test #'string= :documentation "GTIRB Version as a string of \"MAJOR.MINOR.PATCH\".") (define-constant protobuf-version (cdr (assoc 'VERSION_PROTOBUF version.txt)) :test #'= :documentation "GTIRB Protobuf Version as a non-negative integer.") ================================================ FILE: conanfile.py ================================================ import os import re from conans import CMake, ConanFile, tools from conans.errors import ConanInvalidConfiguration from conans.model.version import Version def get_gtirb_version(): if "CI_COMMIT_REF_NAME" in os.environ: branch = os.environ["CI_COMMIT_REF_NAME"] if branch == "master": return "dev" try: with open("version.txt") as f: s = f.read() match = re.search( r"VERSION_MAJOR(\s+)(\S+)(\s+)" r"VERSION_MINOR(\s+)(\S+)(\s+)" r"VERSION_PATCH(\s+)(\S+)(\s+)", s, ) if match: major = 
match.group(2) minor = match.group(5) patch = match.group(8) return major + "." + minor + "." + patch else: return "" except Exception: return "" def branch_to_channel(branch): if re.match(r"^release-.*", branch): return "stable" else: return branch.replace("/", "+") class Properties: name = "gtirb" rel_url = "rewriting/gtirb" exports_sources = "*", "!*_CPack_Packages*", "!*java*.class" @property def version(self): if not hasattr(self, "_version"): self._version = get_gtirb_version() return self._version @version.setter def version(self, ver): self._version = ver @property def description(self): return "%s library" % self.name @property def url(self): return "https://git.grammatech.com/%s" % self.rel_url @property def conan_channel(self): channel = "local" if "CI_COMMIT_REF_NAME" in os.environ: branch = os.environ["CI_COMMIT_REF_NAME"] channel = branch_to_channel(branch) return channel @property def archived_channels(self): # Add to this list branch names to have conan packages for # branches archived in gitlab. 
archived_branches = ["master"] # Also, archive the 'stable' channel, where all stable versions # will be uploaded archived_channels = ["stable"] return archived_channels + list( map(branch_to_channel, archived_branches) ) @property def conan_ref(self): channel = self.conan_channel return "%s/%s" % (self.rel_url.replace("/", "+"), channel) @property def conan_recipe(self): return "%s/%s@%s" % (self.name, self.version, self.conan_ref) class GtirbConan(Properties, ConanFile): boost_version = "1.69.0" protobuf_version = "3.15.5" requires = ( "boost/{0}".format(boost_version), "protobuf/{0}".format(protobuf_version), ) settings = "os", "build_type", "compiler", "arch" generators = "cmake" def configure(self): if ( self.settings.compiler == "gcc" and self.settings.compiler.libcxx != "libstdc++11" ): raise ConanInvalidConfiguration( "gtirb requires libstdc++11 ABI, update your conan profile" ) def build_requirements(self): if self.settings.os == "Windows": self.build_requires("ninja/1.10.2") def build(self): if self.settings.os == "Windows": with tools.vcvars( self.settings, force=True, filter_known_paths=False ): self.build_cmake() else: self.build_cmake() def build_cmake(self): # Note: Only build the C++ API defs = { "CMAKE_VERBOSE_MAKEFILE:BOOL": "ON", "ENABLE_CONAN:BOOL": "ON", "GTIRB_CXX_API:BOOL": "ON", "GTIRB_PY_API:BOOL": "OFF", "GTIRB_CL_API:BOOL": "OFF", "GTIRB_JAVA_API:BOOL": "OFF", } disable_parallel_build = ( int(os.environ.get("GTIRB_DISABLE_PARALLEL_BUILD", "0")) != 0 ) if self.settings.os == "Windows": cmake = CMake(self, generator="Ninja") defs.update( { k: os.environ.get(k) for k in ["BOOST_ROOT", "CMAKE_PREFIX_PATH", "PYTHON"] } ) defs.update({"Protobuf_USE_STATIC_LIBS": "ON"}) if disable_parallel_build: defs["GTIRB_MSVC_PARALLEL_COMPILE_JOBS"] = "1" else: cmake = CMake(self, generator=None) defs.update({"GTIRB_STRIP_DEBUG_SYMBOLS:BOOL": "ON"}) cmake.configure( source_folder=".", defs=defs, ) if disable_parallel_build: cmake.parallel = False 
cmake.build() cmake.test(output_on_failure=True) cmake.install() # The patch_config_paths() function will change absolute paths in the # exported cmake config files to use the appropriate conan variables # instead. # It is an experimental feature of conan, however, so if you're having # trouble with paths in the cmake of the conan package, it could that # this function is no longer doing what we want. cmake.patch_config_paths() def package(self): pass def package_info(self): self.cpp_info.libs = ["gtirb"] def package_id(self): v = Version(str(self.settings.compiler.version)) if self.settings.compiler == "Visual Studio" and v in ["15", "16"]: self.info.settings.compiler.version = "Visual Studio 15 and 16" ================================================ FILE: cpack-config.cmake ================================================ # Global properties set(CMAKE_PROJECT_HOMEPAGE_URL https://github.com/GrammaTech/gtirb) set(CPACK_COMPONENTS_GROUPING ALL_COMPONENTS_IN_ONE) set(CPACK_DEB_COMPONENT_INSTALL ON) # Reusable lists of components set(LIB_COMPONENTS library license) set(DEV_COMPONENTS headers proto_library cmake_config cmake_target) # Debian packages if("${CPACK_GTIRB_PACKAGE}" STREQUAL "debian-lib") set(CPACK_DEBIAN_PACKAGE_NAME "libgtirb") set(CPACK_DEBIAN_FILE_NAME DEB-DEFAULT) set(CPACK_COMPONENTS_ALL ${LIB_COMPONENTS}) if("${CPACK_DEBIAN_PACKAGE_RELEASE}" STREQUAL "focal") set(CPACK_DEBIAN_PACKAGE_DEPENDS "libstdc++6, libc6, libgcc1, libprotobuf17" ) elseif("${CPACK_DEBIAN_PACKAGE_RELEASE}" STREQUAL "jammy") set(CPACK_DEBIAN_PACKAGE_DEPENDS "libstdc++6, libc6, libgcc-s1, libprotobuf23" ) elseif("${CPACK_DEBIAN_PACKAGE_RELEASE}" STREQUAL "noble") set(CPACK_DEBIAN_PACKAGE_DEPENDS "libstdc++6, libc6, libgcc-s1, libprotobuf32t64" ) else() message( SEND_ERROR "Unknown / missing value for CPACK_DEBIAN_PACKAGE_RELEASE." 
) endif() elseif("${CPACK_GTIRB_PACKAGE}" STREQUAL "debian-dev") set(CPACK_DEBIAN_PACKAGE_NAME "libgtirb-dev") set(CPACK_DEBIAN_FILE_NAME DEB-DEFAULT) set(CPACK_COMPONENTS_ALL ${DEV_COMPONENTS}) set(CPACK_DEBIAN_PACKAGE_DEPENDS "libgtirb (=${CPACK_GTIRB_VERSION}-${CPACK_DEBIAN_PACKAGE_RELEASE}), libboost-dev (>=1.68) | libboost1.68-dev, libprotobuf-dev (>=${CPACK_PROTOBUF_VERSION_LOWER_BOUND}~), libprotobuf-dev (<<${CPACK_PROTOBUF_VERSION_UPPER_BOUND})" ) elseif("${CPACK_GTIRB_PACKAGE}" STREQUAL "debian-debug") set(CPACK_DEBIAN_PACKAGE_NAME "libgtirb-dbg") set(CPACK_DEBIAN_FILE_NAME DEB-DEFAULT) set(CPACK_COMPONENTS_ALL debug-file) set(CPACK_DEBIAN_PACKAGE_DEPENDS "libgtirb (=${CPACK_GTIRB_VERSION}-${CPACK_DEBIAN_PACKAGE_RELEASE})" ) endif() ================================================ FILE: doc/CFG-Edges.md ================================================ Advice on when to Place ICFG Edges ================================== It is not always straightforward when to construct ICFG edges. For example, should there be an edge from a function's return to every caller of that function? While GTIRB does not preclude or enforce any particular ICFG connection strategy, we do propose the following suggestions for how to handle many common situations. ## Undefined/extern functions. How to handle edges leaving call instructions to undefined or extern functions? In this case the function is not included in the module and thus is not a possible edge target in the ICFG. > ???? ## Fall through edges from call sites. Since we're working with an interprocedural CFG, we have edges from call instructions to their targets. Do we also have edges from a call instruction to the instruction immediately after it in memory? > Yes unless we know the callee does not return (e.g., exit). ### Non-return functions. When generating code around non-return functions (like exit): sometimes compilers omit any following code if they know a call will not return. 
For example in a situation like this (except in machine code): ```C void foo() { if (something) { bar_that_always_calls_exit(); // stack cleanup return; } } ``` In some cases, the compiler will know that `bar_that_always_calls_exit()` will never return. In some cases, the compiler doesn't figure that out. In the former case, the compiler may omit the "stack cleanup" and "return" code. In the latter case, it will not. In some cases, your disassembly engine will know that `bar_that_always_calls_exit()` will never return. In some cases, your disassembly engine doesn't figure that out. In the former case, you can choose to omit the "fall-through" edge in your IR. In the latter case, you won't, because you think the execution flow is possible. So, if you get the combination: the compiler figured it out and you did *not*. Then you will add the CFG edge from `bar_that_always_calls_exit()` to whatever follows. But whatever follows will not necessarily be code in the function `foo()` or code at all really. It will be whatever random chunk of bytes the compiler happened to plop down next. We bring this up because it has bearing on your stance for adding edges from callsites to their follows. If you don't do that, you'll never make this mistake. However, we suggest that in the balance, having the edges when your disassembly is correct outweighs the presence of this error. ## Edges from returns back to call sites. What about from a return instruction to corresponding call sites (plural) (or rather the instructions that follow them)? > Yes. ## Edges from indirect calls to targets. Indirect calls: we won't know who the targets are always. And we won't know to add edges from corresponding return instructions. > We put in edges (to and from) as we're able to identify them. We > don't conservatively put edges between every indirect call and every > function. ## Tail calls. Tail calls don't have return instructions or a place for a callee to return to. 
> Hook up the eventual return of a tail called function to the places > it could lead (i.e., non tail-call callers and callers of tail-call > callers). ================================================ FILE: doc/CMakeLists.txt ================================================ add_custom_target(doc) file(MAKE_DIRECTORY "${CMAKE_CURRENT_BINARY_DIR}/html") if(CXX_API) set(CPP_TAGFILE "${CMAKE_CURRENT_BINARY_DIR}/CPP_DOXY.tag") set(CPP_TAGFILE_RULE "${CPP_TAGFILE}=cpp") set(CPP_DOX_ENABLED "CPP_ONLY") set(CPP_API_VISIBLE "yes") add_subdirectory(cpp) else() set(CPP_TAGFILE_RULE "") set(CPP_DOX_ENABLED "") set(CPP_API_VISIBLE "no") endif() if(PY_API) add_subdirectory(python) set(PY_DOX_ENABLED "PY_ONLY") set(PY_API_VISIBLE "yes") else() set(PY_DOX_ENABLED "") set(PY_API_VISIBLE "no") endif() if(CL_API) add_subdirectory(cl) set(CL_DOX_ENABLED "CL_ONLY") set(CL_API_VISIBLE "yes") else() set(CL_DOX_ENABLED "") set(CL_API_VISIBLE "no") endif() if(JAVA_API) add_subdirectory(java) set(JAVA_DOX_ENABLED "JAVA_ONLY") set(JAVA_API_VISIBLE "yes") else() set(JAVA_DOX_ENABLED "") set(JAVA_API_VISIBLE "no") endif() add_subdirectory(examples) add_subdirectory(general) ================================================ FILE: doc/binary-representation.md ================================================ Binary Representation with GTIRB ================================ - [Representing Binaries](#representing-binaries) - [Sections](#sections) - [Symbols](#symbols) - [Byte Intervals](#byte-intervals) - [Symbolic Expressions](#symbolic-expressions) GTIRB portably encodes binaries from a range of standard executable and linkable formats, such as [ELF](https://en.wikipedia.org/wiki/Executable_and_Linkable_Format), [PE](https://en.wikipedia.org/wiki/Portable_Executable), and [Mach-O](https://en.wikipedia.org/wiki/Mach-O), allowing conversion to and from these formats to GTIRB. 
To ensure all information from the original binary is retained despite standard GTIRB data structures--which are intended to be general across all binary representations--being lossy for many aspects of a particular representation, encoders are encouraged to include all raw bytes of the original file in the GTIRB encoding.
These symbols have a name, a set of properties, and a *referent*. A referent may be an integer, indicating that the symbol is a numeric constant or fixed address, or a reference to a *block*. A block may be one of: | Block Kind | Description | |---------------|---------------------------------------------------------| | *code block* | a series of executable instructions | | *data block* | a series of data bytes | | *proxy block* | indicating that the symbol is defined in another module | ### Byte Intervals The bytes of a section are subdivided into chunks of bytes called *byte intervals*. This indirection layer serves two purposes: - Indicate what blocks can be moved independently of each other. It is guaranteed that you can shuffle around two byte intervals in a section, and doing so will preserve the program's semantics. - Support the generation of blocks with no original address. Byte intervals may have a fixed address, but they may also be unfixed, likely indicating that the byte interval was generated by a binary rewriting tool or is freely movable to any address. Two byte intervals in the same section may not overlap in addresses (although sections can overlap with each other in some cases, such as in object code). Byte intervals contain code blocks or data blocks. The blocks within a byte interval *can* overlap. Examples of overlapping blocks include: - Overlapping data blocks are common. - One data block may representing an array may overlap many data blocks representing elements of the array. - Compilers often overlap strings with shared suffixes. The data blocks representing these strings will similarly overlap. * Overlapping code blocks are rare, however particularly clever or malicious code blocks in variable-width ISAs may overlap when two different sequences of instructions serialize to machine-code bytes which share common subsequences. 
Byte intervals also hold [symbolic expressions](#symbolic-expressions) which indicate symbolic contents of code or data blocks. ### Symbolic Expressions To encode relocations, GTIRB associates *symbolic expressions* with byte-intervals. These specify that certain bytes in the binary refer to the address. This allows these bytes to be recalculated when the referent is moved in the binary image. GTIRB does not specify exactly how symbolic expressions are transformed into bytes. This depends on where the symbolic expression is located; inside a code block, it depends on what part of an instruction it is of, while inside a data block, it depends on the size of the data block. There are currently three kinds of symbolic expressions: | Kind | Description | |-----------------|-------------------| | *SymAddrConst* | the address of the referent of a symbol, plus or minus a fixed offset | | *SymAddrAddr* | the difference between two symbols, divided by a scale and plus an offset | ================================================ FILE: doc/cl/CMakeLists.txt ================================================ set(SDT_SCRIPT ${CMAKE_CURRENT_SOURCE_DIR}/write-documentation.lisp) set(README ${CMAKE_SOURCE_DIR}/cl/README.md) set(HTML_INDEX ${CMAKE_BINARY_DIR}/doc/html/cl/index.html) file(MAKE_DIRECTORY "${CMAKE_BINARY_DIR}/doc/html/cl") file(GLOB CL_SOURCES ${CMAKE_SOURCE_DIR}/cl/*.lisp ${CMAKE_SOURCE_DIR}/cl/*.asd) add_custom_command( OUTPUT ${HTML_INDEX} DEPENDS ${SDT_SCRIPT} ${README} ${CL_SOURCES} COMMAND ${LISP} --noinform --dynamic-space-size 16384 --no-userinit --no-sysinit --disable-debugger --load ${QUICKLISP}/setup.lisp --eval "(asdf:initialize-source-registry `(:source-registry (:tree \"${CMAKE_SOURCE_DIR}/cl\") :inherit-configuration))" --script ${SDT_SCRIPT} gtirb ${README} ${HTML_INDEX} VERBATIM COMMENT "Generating API documentation with SDT" ) add_custom_target(sdt ALL DEPENDS ${HTML_INDEX}) add_dependencies(doc sdt) ================================================ 
FILE: doc/cl/write-documentation.lisp ================================================ ;; -*- lisp -*- ;; ;; Usage: write-documentation PKG ABSTRACT OUTPUT-HTML ;; Write the automatically generated documentation for PKG to ;; OUTPUT-HTML. The ABSTRACT should be a file in Markdown format to ;; place at the top of the generated documentation. ;; (load "~/.sbclrc" :if-does-not-exist nil) (ql:quickload :alexandria) (ql:quickload :simpler-documentation-template) (ql:quickload :markdown.cl) (unless (= (length sb-ext:*posix-argv*) 5) (format t "Usage: write-documentation PKG ABSTRACT OUTPUT-HTML")) (let ((package (alexandria:make-keyword (string-upcase (second sb-ext:*posix-argv*)))) (abstract-path (third sb-ext:*posix-argv*)) (output-path (fourth sb-ext:*posix-argv*))) (ql:quickload package) #+debug (format t "Writing: ~S~%" (list package abstract-path output-path)) (simpler-documentation-template:create-template package :maybe-skip-methods-p t :target output-path :abstract-html (markdown.cl:parse (with-open-file (in abstract-path) (let* ((file-bytes (file-length in)) (seq (make-string file-bytes)) (file-chars (read-sequence seq in))) (subseq seq 0 file-chars)))))) ================================================ FILE: doc/cpp/CMakeLists.txt ================================================ # based on sample in https://majewsky.wordpress.com/2010/08/14/tip-of-the-day- # cmake-and-doxygen/ add a target to generate API documentation with Doxygen cmake_minimum_required(VERSION 3.3) find_package(Doxygen) if(DOXYGEN_FOUND) set(ROOTDIR "${CMAKE_CURRENT_SOURCE_DIR}/../..") set(DOTDIR "${CMAKE_CURRENT_SOURCE_DIR}/../dot") set(BUILDFILES_IN ../preprocmd.py DoxygenLayout.xml) foreach(_inf ${BUILDFILES_IN}) configure_file( ${CMAKE_CURRENT_SOURCE_DIR}/${_inf} ${CMAKE_CURRENT_BINARY_DIR}/${_inf} @ONLY ) endforeach() # Handle version initialization file(READ "${ROOTDIR}/version.txt" ver) string(REGEX MATCH "VERSION_MAJOR ([0-9]*)" _ ${ver}) set(GTIRB_MAJOR_VERSION ${CMAKE_MATCH_1}) 
string(REGEX MATCH "VERSION_MINOR ([0-9]*)" _ ${ver}) set(GTIRB_MINOR_VERSION ${CMAKE_MATCH_1}) string(REGEX MATCH "VERSION_PATCH ([0-9]*)" _ ${ver}) set(GTIRB_PATCH_VERSION ${CMAKE_MATCH_1}) configure_file( "${ROOTDIR}/include/gtirb/version.h.in" "${ROOTDIR}/include/gtirb/version.h" @ONLY ) configure_file( "${CMAKE_CURRENT_SOURCE_DIR}/Doxyfile.in" "${CMAKE_CURRENT_BINARY_DIR}/Doxyfile" @ONLY ) # adapted from https://gist.github.com/abravalheri/11214134 macro(move_filename file_list newdir) foreach(src_file ${${file_list}}) get_filename_component(src_file_name "${src_file}" NAME) list(REMOVE_ITEM ${file_list} "${src_file}") list(APPEND ${file_list} "${newdir}/${src_file_name}") endforeach() endmacro() # ---------------------------------------------------------------------- # copy dot files into a subdir of the working directory # ---------------------------------------------------------------------- file(GLOB DOTFILES_IN "${DOTDIR}/*") set(DOTFILES ${DOTFILES_IN}) move_filename(DOTFILES ${CMAKE_CURRENT_BINARY_DIR}) # message("DOTFILES = ${DOTFILES}") add_custom_command( OUTPUT ${DOTFILES} WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR} DEPENDS ${DOTFILES_IN} COMMAND mkdir -p dot COMMAND ${CMAKE_COMMAND} -E copy_directory ${DOTDIR} dot COMMENT "copying dot dir" VERBATIM ) # ---------------------------------------------------------------------- # copy md files into the working directory # ---------------------------------------------------------------------- set(MDFILES_IN "${CMAKE_CURRENT_SOURCE_DIR}/README.md") set(MDFILES ${MDFILES_IN}) move_filename(MDFILES ${CMAKE_CURRENT_BINARY_DIR}) # message("MDFILES = ${MDFILES}") gtirb_find_python() foreach(_inmd ${MDFILES_IN}) get_filename_component(_outmd "${_inmd}" NAME) add_custom_command( OUTPUT ${_outmd} WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR} DEPENDS ${_inmd} COMMAND ${CMAKE_COMMAND} -E copy ${_inmd} "${_outmd}.in" COMMAND ${PYTHON} ../preprocmd.py "${_outmd}.in" ${_outmd} COMMENT "processing ${_outmd}" VERBATIM 
) endforeach() # ---------------------------------------------------------------------- # Main target # ---------------------------------------------------------------------- add_custom_target( cpp_doxyout WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR} DEPENDS ${DOTFILES} DEPENDS ${MDFILES} COMMAND ${DOXYGEN_EXECUTABLE} ${CMAKE_CURRENT_BINARY_DIR}/Doxyfile COMMENT "Generating C++ API documentation with Doxygen" VERBATIM ) add_dependencies(doc cpp_doxyout) endif(DOXYGEN_FOUND) ================================================ FILE: doc/cpp/Doxyfile.in ================================================ # Doxyfile 1.8.11 # This file describes the settings to be used by the documentation system # doxygen (www.doxygen.org) for a project. # # All text after a double hash (##) is considered a comment and is placed in # front of the TAG it is preceding. # # All text after a single hash (#) is considered a comment and will be ignored. # The format is: # TAG = value [value, ...] # For lists, items can also be appended using: # TAG += value [value, ...] # Values that contain spaces should be placed between quotes (\" \"). #--------------------------------------------------------------------------- # Project related configuration options #--------------------------------------------------------------------------- # This tag specifies the encoding used for all characters in the config file # that follow. The default is UTF-8 which is also the encoding used for all text # before the first occurrence of this tag. Doxygen uses libiconv (or the iconv # built into libc) for the transcoding. See http://www.gnu.org/software/libiconv # for the list of possible encodings. # The default value is: UTF-8. DOXYFILE_ENCODING = UTF-8 # The PROJECT_NAME tag is a single word (or a sequence of words surrounded by # double-quotes, unless you are using Doxywizard) that should identify the # project for which the documentation is generated. 
This name is used in the # title of most generated pages and in a few other places. # The default value is: My Project. PROJECT_NAME = GTIRB # The PROJECT_NUMBER tag can be used to enter a project or revision number. This # could be handy for archiving the generated documentation or if some version # control system is used. PROJECT_NUMBER = v@GTIRB_MAJOR_VERSION@.@GTIRB_MINOR_VERSION@.@GTIRB_PATCH_VERSION@ # Using the PROJECT_BRIEF tag one can provide an optional one line description # for a project that appears at the top of each page and should give viewer a # quick idea about the purpose of the project. Keep the description short. PROJECT_BRIEF = "GrammaTech Intermediate Representation for Binaries: C++ API" # With the PROJECT_LOGO tag one can specify a logo or an icon that is included # in the documentation. The maximum height of the logo should not exceed 55 # pixels and the maximum width should not exceed 200 pixels. Doxygen will copy # the logo to the output directory. PROJECT_LOGO = # The OUTPUT_DIRECTORY tag is used to specify the (relative or absolute) path # into which the generated documentation will be written. If a relative path is # entered, it will be relative to the location where doxygen was started. If # left blank the current directory will be used. OUTPUT_DIRECTORY = @CMAKE_BINARY_DIR@/doc # If the CREATE_SUBDIRS tag is set to YES then doxygen will create 4096 sub- # directories (in 2 levels) under the output directory of each output format and # will distribute the generated files over these directories. Enabling this # option can be useful when feeding doxygen a huge amount of source files, where # putting all generated files in the same directory would otherwise causes # performance problems for the file system. # The default value is: NO. CREATE_SUBDIRS = NO # If the ALLOW_UNICODE_NAMES tag is set to YES, doxygen will allow non-ASCII # characters to appear in the names of generated files. 
If set to NO, non-ASCII # characters will be escaped, for example _xE3_x81_x84 will be used for Unicode # U+3044. # The default value is: NO. ALLOW_UNICODE_NAMES = NO # The OUTPUT_LANGUAGE tag is used to specify the language in which all # documentation generated by doxygen is written. Doxygen will use this # information to generate all constant output in the proper language. # Possible values are: Afrikaans, Arabic, Armenian, Brazilian, Catalan, Chinese, # Chinese-Traditional, Croatian, Czech, Danish, Dutch, English (United States), # Esperanto, Farsi (Persian), Finnish, French, German, Greek, Hungarian, # Indonesian, Italian, Japanese, Japanese-en (Japanese with English messages), # Korean, Korean-en (Korean with English messages), Latvian, Lithuanian, # Macedonian, Norwegian, Persian (Farsi), Polish, Portuguese, Romanian, Russian, # Serbian, Serbian-Cyrillic, Slovak, Slovene, Spanish, Swedish, Turkish, # Ukrainian and Vietnamese. # The default value is: English. OUTPUT_LANGUAGE = English # If the BRIEF_MEMBER_DESC tag is set to YES, doxygen will include brief member # descriptions after the members that are listed in the file and class # documentation (similar to Javadoc). Set to NO to disable this. # The default value is: YES. BRIEF_MEMBER_DESC = YES # If the REPEAT_BRIEF tag is set to YES, doxygen will prepend the brief # description of a member or function before the detailed description # # Note: If both HIDE_UNDOC_MEMBERS and BRIEF_MEMBER_DESC are set to NO, the # brief descriptions will be completely suppressed. # The default value is: YES. REPEAT_BRIEF = YES # This tag implements a quasi-intelligent brief description abbreviator that is # used to form the text in various listings. Each string in this list, if found # as the leading text of the brief description, will be stripped from the text # and the result, after processing the whole list, is used as the annotated # text. Otherwise, the brief description is used as-is. 
If left blank, the # following values are used ($name is automatically replaced with the name of # the entity):The $name class, The $name widget, The $name file, is, provides, # specifies, contains, represents, a, an and the. ABBREVIATE_BRIEF = "The $name class" \ "The $name widget" \ "The $name file" \ is \ provides \ specifies \ contains \ represents \ a \ an \ the # If the ALWAYS_DETAILED_SEC and REPEAT_BRIEF tags are both set to YES then # doxygen will generate a detailed section even if there is only a brief # description. # The default value is: NO. ALWAYS_DETAILED_SEC = NO # If the INLINE_INHERITED_MEMB tag is set to YES, doxygen will show all # inherited members of a class in the documentation of that class as if those # members were ordinary class members. Constructors, destructors and assignment # operators of the base classes will not be shown. # The default value is: NO. INLINE_INHERITED_MEMB = NO # If the FULL_PATH_NAMES tag is set to YES, doxygen will prepend the full path # before files name in the file list and in the header files. If set to NO the # shortest path that makes the file name unique will be used # The default value is: YES. FULL_PATH_NAMES = NO # The STRIP_FROM_PATH tag can be used to strip a user-defined part of the path. # Stripping is only done if one of the specified strings matches the left-hand # part of the path. The tag can be used to show relative paths in the file list. # If left blank the directory from which doxygen is run is used as the path to # strip. # # Note that you can specify absolute paths here, but also relative paths, which # will be relative from the directory where doxygen is started. # This tag requires that the tag FULL_PATH_NAMES is set to YES. STRIP_FROM_PATH = . # The STRIP_FROM_INC_PATH tag can be used to strip a user-defined part of the # path mentioned in the documentation of a class, which tells the reader which # header file to include in order to use a class. 
If left blank only the name of # the header file containing the class definition is used. Otherwise one should # specify the list of include paths that are normally passed to the compiler # using the -I flag. STRIP_FROM_INC_PATH = # If the SHORT_NAMES tag is set to YES, doxygen will generate much shorter (but # less readable) file names. This can be useful if your file system doesn't # support long names like on DOS, Mac, or CD-ROM. # The default value is: NO. SHORT_NAMES = NO # If the JAVADOC_AUTOBRIEF tag is set to YES then doxygen will interpret the # first line (until the first dot) of a Javadoc-style comment as the brief # description. If set to NO, the Javadoc-style will behave just like regular Qt- # style comments (thus requiring an explicit @brief command for a brief # description.) # The default value is: NO. JAVADOC_AUTOBRIEF = NO # If the QT_AUTOBRIEF tag is set to YES then doxygen will interpret the first # line (until the first dot) of a Qt-style comment as the brief description. If # set to NO, the Qt-style will behave just like regular Qt-style comments (thus # requiring an explicit \brief command for a brief description.) # The default value is: NO. QT_AUTOBRIEF = NO # The MULTILINE_CPP_IS_BRIEF tag can be set to YES to make doxygen treat a # multi-line C++ special comment block (i.e. a block of //! or /// comments) as # a brief description. This used to be the default behavior. The new default is # to treat a multi-line C++ comment block as a detailed description. Set this # tag to YES if you prefer the old behavior instead. # # Note that setting this tag to YES also means that rational rose comments are # not recognized any more. # The default value is: NO. MULTILINE_CPP_IS_BRIEF = NO # If the INHERIT_DOCS tag is set to YES then an undocumented member inherits the # documentation from any documented member that it re-implements. # The default value is: YES. 
INHERIT_DOCS = YES # If the SEPARATE_MEMBER_PAGES tag is set to YES then doxygen will produce a new # page for each member. If set to NO, the documentation of a member will be part # of the file/class/namespace that contains it. # The default value is: NO. SEPARATE_MEMBER_PAGES = NO # The TAB_SIZE tag can be used to set the number of spaces in a tab. Doxygen # uses this value to replace tabs by spaces in code fragments. # Minimum value: 1, maximum value: 16, default value: 4. TAB_SIZE = 4 # This tag can be used to specify a number of aliases that act as commands in # the documentation. An alias has the form: # name=value # For example adding # "sideeffect=@par Side Effects:\n" # will allow you to put the command \sideeffect (or @sideeffect) in the # documentation, which will result in a user-defined paragraph with heading # "Side Effects:". You can put \n's in the value part of an alias to insert # newlines. ALIASES = # This tag can be used to specify a number of word-keyword mappings (TCL only). # A mapping has the form "name=value". For example adding "class=itcl::class" # will allow you to use the command class in the itcl::class meaning. TCL_SUBST = # Set the OPTIMIZE_OUTPUT_FOR_C tag to YES if your project consists of C sources # only. Doxygen will then generate output that is more tailored for C. For # instance, some of the names that are used will be different. The list of all # members will be omitted, etc. # The default value is: NO. OPTIMIZE_OUTPUT_FOR_C = NO # Set the OPTIMIZE_OUTPUT_JAVA tag to YES if your project consists of Java or # Python sources only. Doxygen will then generate output that is more tailored # for that language. For instance, namespaces will be presented as packages, # qualified scopes will look different, etc. # The default value is: NO. OPTIMIZE_OUTPUT_JAVA = NO # Set the OPTIMIZE_FOR_FORTRAN tag to YES if your project consists of Fortran # sources. Doxygen will then generate output that is tailored for Fortran. 
# The default value is: NO. OPTIMIZE_FOR_FORTRAN = NO # Set the OPTIMIZE_OUTPUT_VHDL tag to YES if your project consists of VHDL # sources. Doxygen will then generate output that is tailored for VHDL. # The default value is: NO. OPTIMIZE_OUTPUT_VHDL = NO # Doxygen selects the parser to use depending on the extension of the files it # parses. With this tag you can assign which parser to use for a given # extension. Doxygen has a built-in mapping, but you can override or extend it # using this tag. The format is ext=language, where ext is a file extension, and # language is one of the parsers supported by doxygen: IDL, Java, Javascript, # C#, C, C++, D, PHP, Objective-C, Python, Fortran (fixed format Fortran: # FortranFixed, free formatted Fortran: FortranFree, unknown formatted Fortran: # Fortran. In the latter case the parser tries to guess whether the code is fixed # or free formatted code, this is the default for Fortran type files), VHDL. For # instance to make doxygen treat .inc files as Fortran files (default is PHP), # and .f files as C (default is Fortran), use: inc=Fortran f=C. # # Note: For files without extension you can use no_extension as a placeholder. # # Note that for custom extensions you also need to set FILE_PATTERNS otherwise # the files are not read by doxygen. EXTENSION_MAPPING = # If the MARKDOWN_SUPPORT tag is enabled then doxygen pre-processes all comments # according to the Markdown format, which allows for more readable # documentation. See http://daringfireball.net/projects/markdown/ for details. # The output of markdown processing is further processed by doxygen, so you can # mix doxygen, HTML, and XML commands with Markdown formatting. Disable only in # case of backward compatibility issues. # The default value is: YES. MARKDOWN_SUPPORT = YES # When enabled doxygen tries to link words that correspond to documented # classes, or namespaces to their corresponding documentation. 
Such a link can # be prevented in individual cases by putting a % sign in front of the word or # globally by setting AUTOLINK_SUPPORT to NO. # The default value is: YES. AUTOLINK_SUPPORT = YES # If you use STL classes (i.e. std::string, std::vector, etc.) but do not want # to include (a tag file for) the STL sources as input, then you should set this # tag to YES in order to let doxygen match function declarations and # definitions whose arguments contain STL classes (e.g. func(std::string); # versus func(std::string) {}). This also makes the inheritance and collaboration # diagrams that involve STL classes more complete and accurate. # The default value is: NO. BUILTIN_STL_SUPPORT = NO # If you use Microsoft's C++/CLI language, you should set this option to YES to # enable parsing support. # The default value is: NO. CPP_CLI_SUPPORT = NO # Set the SIP_SUPPORT tag to YES if your project consists of sip (see: # http://www.riverbankcomputing.co.uk/software/sip/intro) sources only. Doxygen # will parse them like normal C++ but will assume all classes use public instead # of private inheritance when no explicit protection keyword is present. # The default value is: NO. SIP_SUPPORT = NO # For Microsoft's IDL there are propget and propput attributes to indicate # getter and setter methods for a property. Setting this option to YES will make # doxygen replace the get and set methods by a property in the documentation. # This will only work if the methods are indeed getting or setting a simple # type. If this is not the case, or you want to show the methods anyway, you # should set this option to NO. # The default value is: YES. IDL_PROPERTY_SUPPORT = YES # If member grouping is used in the documentation and the DISTRIBUTE_GROUP_DOC # tag is set to YES then doxygen will reuse the documentation of the first # member in the group (if any) for the other members of the group. By default # all members of a group must be documented explicitly. # The default value is: NO. 
DISTRIBUTE_GROUP_DOC = NO # If one adds a struct or class to a group and this option is enabled, then also # any nested class or struct is added to the same group. By default this option # is disabled and one has to add nested compounds explicitly via \ingroup. # The default value is: NO. GROUP_NESTED_COMPOUNDS = NO # Set the SUBGROUPING tag to YES to allow class member groups of the same type # (for instance a group of public functions) to be put as a subgroup of that # type (e.g. under the Public Functions section). Set it to NO to prevent # subgrouping. Alternatively, this can be done per class using the # \nosubgrouping command. # The default value is: YES. SUBGROUPING = YES # When the INLINE_GROUPED_CLASSES tag is set to YES, classes, structs and unions # are shown inside the group in which they are included (e.g. using \ingroup) # instead of on a separate page (for HTML and Man pages) or section (for LaTeX # and RTF). # # Note that this feature does not work in combination with # SEPARATE_MEMBER_PAGES. # The default value is: NO. INLINE_GROUPED_CLASSES = NO # When the INLINE_SIMPLE_STRUCTS tag is set to YES, structs, classes, and unions # with only public data fields or simple typedef fields will be shown inline in # the documentation of the scope in which they are defined (i.e. file, # namespace, or group documentation), provided this scope is documented. If set # to NO, structs, classes, and unions are shown on a separate page (for HTML and # Man pages) or section (for LaTeX and RTF). # The default value is: NO. INLINE_SIMPLE_STRUCTS = NO # When TYPEDEF_HIDES_STRUCT tag is enabled, a typedef of a struct, union, or # enum is documented as struct, union, or enum with the name of the typedef. So # typedef struct TypeS {} TypeT, will appear in the documentation as a struct # with name TypeT. When disabled the typedef will appear as a member of a file, # namespace, or class. And the struct will be named TypeS. 
This can typically be # useful for C code in case the coding convention dictates that all compound # types are typedef'ed and only the typedef is referenced, never the tag name. # The default value is: NO. TYPEDEF_HIDES_STRUCT = YES # The size of the symbol lookup cache can be set using LOOKUP_CACHE_SIZE. This # cache is used to resolve symbols given their name and scope. Since this can be # an expensive process and often the same symbol appears multiple times in the # code, doxygen keeps a cache of pre-resolved symbols. If the cache is too small # doxygen will become slower. If the cache is too large, memory is wasted. The # cache size is given by this formula: 2^(16+LOOKUP_CACHE_SIZE). The valid range # is 0..9, the default is 0, corresponding to a cache size of 2^16=65536 # symbols. At the end of a run doxygen will report the cache usage and suggest # the optimal cache size from a speed point of view. # Minimum value: 0, maximum value: 9, default value: 0. LOOKUP_CACHE_SIZE = 0 #--------------------------------------------------------------------------- # Build related configuration options #--------------------------------------------------------------------------- # If the EXTRACT_ALL tag is set to YES, doxygen will assume all entities in # documentation are documented, even if no documentation was available. Private # class members and static file members will be hidden unless the # EXTRACT_PRIVATE respectively EXTRACT_STATIC tags are set to YES. # Note: This will also disable the warnings about undocumented members that are # normally produced when WARNINGS is set to YES. # The default value is: NO. EXTRACT_ALL = YES # If the EXTRACT_PRIVATE tag is set to YES, all private members of a class will # be included in the documentation. # The default value is: NO. EXTRACT_PRIVATE = NO # If the EXTRACT_PACKAGE tag is set to YES, all members with package or internal # scope will be included in the documentation. # The default value is: NO. 
EXTRACT_PACKAGE = NO # If the EXTRACT_STATIC tag is set to YES, all static members of a file will be # included in the documentation. # The default value is: NO. EXTRACT_STATIC = NO # If the EXTRACT_LOCAL_CLASSES tag is set to YES, classes (and structs) defined # locally in source files will be included in the documentation. If set to NO, # only classes defined in header files are included. Does not have any effect # for Java sources. # The default value is: YES. EXTRACT_LOCAL_CLASSES = YES # This flag is only useful for Objective-C code. If set to YES, local methods, # which are defined in the implementation section but not in the interface are # included in the documentation. If set to NO, only methods in the interface are # included. # The default value is: NO. EXTRACT_LOCAL_METHODS = NO # If this flag is set to YES, the members of anonymous namespaces will be # extracted and appear in the documentation as a namespace called # 'anonymous_namespace{file}', where file will be replaced with the base name of # the file that contains the anonymous namespace. By default anonymous namespace # are hidden. # The default value is: NO. EXTRACT_ANON_NSPACES = YES # If the HIDE_UNDOC_MEMBERS tag is set to YES, doxygen will hide all # undocumented members inside documented classes or files. If set to NO these # members will be included in the various overviews, but no documentation # section is generated. This option has no effect if EXTRACT_ALL is enabled. # The default value is: NO. HIDE_UNDOC_MEMBERS = NO # If the HIDE_UNDOC_CLASSES tag is set to YES, doxygen will hide all # undocumented classes that are normally visible in the class hierarchy. If set # to NO, these classes will be included in the various overviews. This option # has no effect if EXTRACT_ALL is enabled. # The default value is: NO. HIDE_UNDOC_CLASSES = NO # If the HIDE_FRIEND_COMPOUNDS tag is set to YES, doxygen will hide all friend # (class|struct|union) declarations. 
If set to NO, these declarations will be # included in the documentation. # The default value is: NO. HIDE_FRIEND_COMPOUNDS = NO # If the HIDE_IN_BODY_DOCS tag is set to YES, doxygen will hide any # documentation blocks found inside the body of a function. If set to NO, these # blocks will be appended to the function's detailed documentation block. # The default value is: NO. HIDE_IN_BODY_DOCS = NO # The INTERNAL_DOCS tag determines if documentation that is typed after a # \internal command is included. If the tag is set to NO then the documentation # will be excluded. Set it to YES to include the internal documentation. # The default value is: NO. INTERNAL_DOCS = NO # If the CASE_SENSE_NAMES tag is set to NO then doxygen will only generate file # names in lower-case letters. If set to YES, upper-case letters are also # allowed. This is useful if you have classes or files whose names only differ # in case and if your file system supports case sensitive file names. Windows # and Mac users are advised to set this option to NO. # The default value is: system dependent. CASE_SENSE_NAMES = NO # If the HIDE_SCOPE_NAMES tag is set to NO then doxygen will show members with # their full class and namespace scopes in the documentation. If set to YES, the # scope will be hidden. # The default value is: NO. HIDE_SCOPE_NAMES = NO # If the HIDE_COMPOUND_REFERENCE tag is set to NO (default) then doxygen will # append additional text to a page's title, such as Class Reference. If set to # YES the compound reference will be hidden. # The default value is: NO. HIDE_COMPOUND_REFERENCE= NO # If the SHOW_INCLUDE_FILES tag is set to YES then doxygen will put a list of # the files that are included by a file in the documentation of that file. # The default value is: YES. 
SHOW_INCLUDE_FILES = YES # If the SHOW_GROUPED_MEMB_INC tag is set to YES then Doxygen will add for each # grouped member an include statement to the documentation, telling the reader # which file to include in order to use the member. # The default value is: NO. SHOW_GROUPED_MEMB_INC = YES # If the FORCE_LOCAL_INCLUDES tag is set to YES then doxygen will list include # files with double quotes in the documentation rather than with sharp brackets. # The default value is: NO. FORCE_LOCAL_INCLUDES = NO # If the INLINE_INFO tag is set to YES then a tag [inline] is inserted in the # documentation for inline members. # The default value is: YES. INLINE_INFO = YES # If the SORT_MEMBER_DOCS tag is set to YES then doxygen will sort the # (detailed) documentation of file and class members alphabetically by member # name. If set to NO, the members will appear in declaration order. # The default value is: YES. SORT_MEMBER_DOCS = YES # If the SORT_BRIEF_DOCS tag is set to YES then doxygen will sort the brief # descriptions of file, namespace and class members alphabetically by member # name. If set to NO, the members will appear in declaration order. Note that # this will also influence the order of the classes in the class list. # The default value is: NO. SORT_BRIEF_DOCS = YES # If the SORT_MEMBERS_CTORS_1ST tag is set to YES then doxygen will sort the # (brief and detailed) documentation of class members so that constructors and # destructors are listed first. If set to NO the constructors will appear in the # respective orders defined by SORT_BRIEF_DOCS and SORT_MEMBER_DOCS. # Note: If SORT_BRIEF_DOCS is set to NO this option is ignored for sorting brief # member documentation. # Note: If SORT_MEMBER_DOCS is set to NO this option is ignored for sorting # detailed member documentation. # The default value is: NO. SORT_MEMBERS_CTORS_1ST = YES # If the SORT_GROUP_NAMES tag is set to YES then doxygen will sort the hierarchy # of group names into alphabetical order. 
If set to NO the group names will # appear in their defined order. # The default value is: NO. SORT_GROUP_NAMES = YES # If the SORT_BY_SCOPE_NAME tag is set to YES, the class list will be sorted by # fully-qualified names, including namespaces. If set to NO, the class list will # be sorted only by class name, not including the namespace part. # Note: This option is not very useful if HIDE_SCOPE_NAMES is set to YES. # Note: This option applies only to the class list, not to the alphabetical # list. # The default value is: NO. SORT_BY_SCOPE_NAME = NO # If the STRICT_PROTO_MATCHING option is enabled and doxygen fails to do proper # type resolution of all parameters of a function it will reject a match between # the prototype and the implementation of a member function even if there is # only one candidate or it is obvious which candidate to choose by doing a # simple string match. By disabling STRICT_PROTO_MATCHING doxygen will still # accept a match between prototype and implementation in such cases. # The default value is: NO. STRICT_PROTO_MATCHING = NO # The GENERATE_TODOLIST tag can be used to enable (YES) or disable (NO) the todo # list. This list is created by putting \todo commands in the documentation. # The default value is: YES. GENERATE_TODOLIST = YES # The GENERATE_TESTLIST tag can be used to enable (YES) or disable (NO) the test # list. This list is created by putting \test commands in the documentation. # The default value is: YES. GENERATE_TESTLIST = YES # The GENERATE_BUGLIST tag can be used to enable (YES) or disable (NO) the bug # list. This list is created by putting \bug commands in the documentation. # The default value is: YES. GENERATE_BUGLIST = YES # The GENERATE_DEPRECATEDLIST tag can be used to enable (YES) or disable (NO) # the deprecated list. This list is created by putting \deprecated commands in # the documentation. # The default value is: YES. 
GENERATE_DEPRECATEDLIST= YES # The ENABLED_SECTIONS tag can be used to enable conditional documentation # sections, marked by \if ... \endif and \cond # ... \endcond blocks. ENABLED_SECTIONS = # The MAX_INITIALIZER_LINES tag determines the maximum number of lines that the # initial value of a variable or macro / define can have for it to appear in the # documentation. If the initializer consists of more lines than specified here # it will be hidden. Use a value of 0 to hide initializers completely. The # appearance of the value of individual variables and macros / defines can be # controlled using \showinitializer or \hideinitializer command in the # documentation regardless of this setting. # Minimum value: 0, maximum value: 10000, default value: 30. MAX_INITIALIZER_LINES = 30 # Set the SHOW_USED_FILES tag to NO to disable the list of files generated at # the bottom of the documentation of classes and structs. If set to YES, the # list will mention the files that were used to generate the documentation. # The default value is: YES. SHOW_USED_FILES = YES # Set the SHOW_FILES tag to NO to disable the generation of the Files page. This # will remove the Files entry from the Quick Index and from the Folder Tree View # (if specified). # The default value is: YES. SHOW_FILES = YES # Set the SHOW_NAMESPACES tag to NO to disable the generation of the Namespaces # page. This will remove the Namespaces entry from the Quick Index and from the # Folder Tree View (if specified). # The default value is: YES. SHOW_NAMESPACES = YES # The FILE_VERSION_FILTER tag can be used to specify a program or script that # doxygen should invoke to get the current version for each file (typically from # the version control system). Doxygen will invoke the program by executing (via # popen()) the command command input-file, where command is the value of the # FILE_VERSION_FILTER tag, and input-file is the name of an input file provided # by doxygen. 
Whatever the program writes to standard output is used as the file # version. For an example see the documentation. FILE_VERSION_FILTER = # The LAYOUT_FILE tag can be used to specify a layout file which will be parsed # by doxygen. The layout file controls the global structure of the generated # output files in an output format independent way. To create the layout file # that represents doxygen's defaults, run doxygen with the -l option. You can # optionally specify a file name after the option, if omitted DoxygenLayout.xml # will be used as the name of the layout file. # # Note that if you run doxygen from a directory containing a file called # DoxygenLayout.xml, doxygen will parse it automatically even if the LAYOUT_FILE # tag is left empty. LAYOUT_FILE = # The CITE_BIB_FILES tag can be used to specify one or more bib files containing # the reference definitions. This must be a list of .bib files. The .bib # extension is automatically appended if omitted. This requires the bibtex tool # to be installed. See also http://en.wikipedia.org/wiki/BibTeX for more info. # For LaTeX the style of the bibliography can be controlled using # LATEX_BIB_STYLE. To use this feature you need bibtex and perl available in the # search path. See also \cite for info how to create references. CITE_BIB_FILES = #--------------------------------------------------------------------------- # Configuration options related to warning and progress messages #--------------------------------------------------------------------------- # The QUIET tag can be used to turn on/off the messages that are generated to # standard output by doxygen. If QUIET is set to YES this implies that the # messages are off. # The default value is: NO. QUIET = NO # The WARNINGS tag can be used to turn on/off the warning messages that are # generated to standard error (stderr) by doxygen. If WARNINGS is set to YES # this implies that the warnings are on. # # Tip: Turn warnings on while writing the documentation. 
# The default value is: YES. WARNINGS = YES # If the WARN_IF_UNDOCUMENTED tag is set to YES then doxygen will generate # warnings for undocumented members. If EXTRACT_ALL is set to YES then this flag # will automatically be disabled. # The default value is: YES. WARN_IF_UNDOCUMENTED = YES # If the WARN_IF_DOC_ERROR tag is set to YES, doxygen will generate warnings for # potential errors in the documentation, such as not documenting some parameters # in a documented function, or documenting parameters that don't exist or using # markup commands wrongly. # The default value is: YES. WARN_IF_DOC_ERROR = YES # This WARN_NO_PARAMDOC option can be enabled to get warnings for functions that # are documented, but have no documentation for their parameters or return # value. If set to NO, doxygen will only warn about wrong or incomplete # parameter documentation, but not about the absence of documentation. # The default value is: NO. WARN_NO_PARAMDOC = NO # If the WARN_AS_ERROR tag is set to YES then doxygen will immediately stop when # a warning is encountered. # The default value is: NO. WARN_AS_ERROR = NO # The WARN_FORMAT tag determines the format of the warning messages that doxygen # can produce. The string should contain the $file, $line, and $text tags, which # will be replaced by the file and line number from which the warning originated # and the warning text. Optionally the format may contain $version, which will # be replaced by the version of the file (if it could be obtained via # FILE_VERSION_FILTER) # The default value is: $file:$line: $text. WARN_FORMAT = "$file:$line: $text" # The WARN_LOGFILE tag can be used to specify a file to which warning and error # messages should be written. If left blank the output is written to standard # error (stderr). 
WARN_LOGFILE = doxygen_warnings.txt #--------------------------------------------------------------------------- # Configuration options related to the input files #--------------------------------------------------------------------------- # The INPUT tag is used to specify the files and/or directories that contain # documented source files. You may enter file names like myfile.cpp or # directories like /usr/src/myproject. Separate the files or directories with # spaces. See also FILE_PATTERNS and EXTENSION_MAPPING # Note: If this tag is empty the current directory is searched. INPUT = @CMAKE_CURRENT_SOURCE_DIR@/../../include @CMAKE_CURRENT_SOURCE_DIR@/../dot \ README.md # This tag can be used to specify the character encoding of the source files # that doxygen parses. Internally doxygen uses the UTF-8 encoding. Doxygen uses # libiconv (or the iconv built into libc) for the transcoding. See the libiconv # documentation (see: http://www.gnu.org/software/libiconv) for the list of # possible encodings. # The default value is: UTF-8. INPUT_ENCODING = UTF-8 # If the value of the INPUT tag contains directories, you can use the # FILE_PATTERNS tag to specify one or more wildcard patterns (like *.cpp and # *.h) to filter out the source-files in the directories. # # Note that for custom extensions or not directly supported extensions you also # need to set EXTENSION_MAPPING for the extension otherwise the files are not # read by doxygen. # # If left blank the following patterns are tested:*.c, *.cc, *.cxx, *.cpp, # *.c++, *.java, *.ii, *.ixx, *.ipp, *.i++, *.inl, *.idl, *.ddl, *.odl, *.h, # *.hh, *.hxx, *.hpp, *.h++, *.cs, *.d, *.php, *.php4, *.php5, *.phtml, *.inc, # *.m, *.markdown, *.md, *.mm, *.dox, *.py, *.pyw, *.f90, *.f, *.for, *.tcl, # *.vhd, *.vhdl, *.ucf, *.qsf, *.as and *.js. 
FILE_PATTERNS = *.c \ *.cc \ *.cxx \ *.cpp \ *.c++ \ *.java \ *.ii \ *.ixx \ *.ipp \ *.i++ \ *.inl \ *.idl \ *.ddl \ *.odl \ *.h \ *.hh \ *.hxx \ *.hpp \ *.h++ \ *.cs \ *.d \ *.php \ *.php4 \ *.php5 \ *.phtml \ *.inc \ *.m \ *.markdown \ *.md \ *.mm \ *.dox \ *.py \ *.pyw \ *.f90 \ *.f \ *.for \ *.tcl \ *.vhd \ *.vhdl \ *.ucf \ *.qsf \ *.as \ *.js # The RECURSIVE tag can be used to specify whether or not subdirectories should # be searched for input files as well. # The default value is: NO. RECURSIVE = YES # The EXCLUDE tag can be used to specify files and/or directories that should be # excluded from the INPUT source files. This way you can easily exclude a # subdirectory from a directory tree whose root is specified with the INPUT tag. # # Note that relative paths are relative to the directory from which doxygen is # run. EXCLUDE = # The EXCLUDE_SYMLINKS tag can be used to select whether or not files or # directories that are symbolic links (a Unix file system feature) are excluded # from the input. # The default value is: NO. EXCLUDE_SYMLINKS = NO # If the value of the INPUT tag contains directories, you can use the # EXCLUDE_PATTERNS tag to specify one or more wildcard patterns to exclude # certain files from those directories. # # Note that the wildcards are matched against the file with absolute path, so to # exclude all test directories for example use the pattern */test/* EXCLUDE_PATTERNS = */include/proto/*.h # The EXCLUDE_SYMBOLS tag can be used to specify one or more symbol names # (namespaces, classes, functions, etc.) that should be excluded from the # output. The symbol name can be a fully qualified name, a word, or if the # wildcard * is used, a substring. 
Examples: ANamespace, AClass, # AClass::ANamespace, ANamespace::*Test # # Note that the wildcards are matched against the file with absolute path, so to # exclude all test directories use the pattern */test/* EXCLUDE_SYMBOLS = proto # The EXAMPLE_PATH tag can be used to specify one or more files or directories # that contain example code fragments that are included (see the \include # command). EXAMPLE_PATH = # If the value of the EXAMPLE_PATH tag contains directories, you can use the # EXAMPLE_PATTERNS tag to specify one or more wildcard pattern (like *.cpp and # *.h) to filter out the source-files in the directories. If left blank all # files are included. EXAMPLE_PATTERNS = * # If the EXAMPLE_RECURSIVE tag is set to YES then subdirectories will be # searched for input files to be used with the \include or \dontinclude commands # irrespective of the value of the RECURSIVE tag. # The default value is: NO. EXAMPLE_RECURSIVE = NO # The IMAGE_PATH tag can be used to specify one or more files or directories # that contain images that are to be included in the documentation (see the # \image command). IMAGE_PATH = # The INPUT_FILTER tag can be used to specify a program that doxygen should # invoke to filter for each input file. Doxygen will invoke the filter program # by executing (via popen()) the command: # # # # where is the value of the INPUT_FILTER tag, and is the # name of an input file. Doxygen will then use the output that the filter # program writes to standard output. If FILTER_PATTERNS is specified, this tag # will be ignored. # # Note that the filter must not add or remove lines; it is applied before the # code is scanned, but not when the output code is generated. If lines are added # or removed, the anchors will not be placed correctly. # # Note that for custom extensions or not directly supported extensions you also # need to set EXTENSION_MAPPING for the extension otherwise the files are not # properly processed by doxygen. 
INPUT_FILTER = # The FILTER_PATTERNS tag can be used to specify filters on a per file pattern # basis. Doxygen will compare the file name with each pattern and apply the # filter if there is a match. The filters are a list of the form: pattern=filter # (like *.cpp=my_cpp_filter). See INPUT_FILTER for further information on how # filters are used. If the FILTER_PATTERNS tag is empty or if none of the # patterns match the file name, INPUT_FILTER is applied. # # Note that for custom extensions or not directly supported extensions you also # need to set EXTENSION_MAPPING for the extension otherwise the files are not # properly processed by doxygen. FILTER_PATTERNS = # If the FILTER_SOURCE_FILES tag is set to YES, the input filter (if set using # INPUT_FILTER) will also be used to filter the input files that are used for # producing the source files to browse (i.e. when SOURCE_BROWSER is set to YES). # The default value is: NO. FILTER_SOURCE_FILES = NO # The FILTER_SOURCE_PATTERNS tag can be used to specify source filters per file # pattern. A pattern will override the setting for FILTER_PATTERN (if any) and # it is also possible to disable source filtering for a specific pattern using # *.ext= (so without naming a filter). # This tag requires that the tag FILTER_SOURCE_FILES is set to YES. FILTER_SOURCE_PATTERNS = # If the USE_MDFILE_AS_MAINPAGE tag refers to the name of a markdown file that # is part of the input, its contents will be placed on the main page # (index.html). This can be useful if you have a project on for instance GitHub # and want to reuse the introduction page also for the doxygen output. USE_MDFILE_AS_MAINPAGE = README.md #--------------------------------------------------------------------------- # Configuration options related to source browsing #--------------------------------------------------------------------------- # If the SOURCE_BROWSER tag is set to YES then a list of source files will be # generated. 
Documented entities will be cross-referenced with these sources. # # Note: To get rid of all source code in the generated output, make sure that # also VERBATIM_HEADERS is set to NO. # The default value is: NO. SOURCE_BROWSER = NO # Setting the INLINE_SOURCES tag to YES will include the body of functions, # classes and enums directly into the documentation. # The default value is: NO. INLINE_SOURCES = NO # Setting the STRIP_CODE_COMMENTS tag to YES will instruct doxygen to hide any # special comment blocks from generated source code fragments. Normal C, C++ and # Fortran comments will always remain visible. # The default value is: YES. STRIP_CODE_COMMENTS = YES # If the REFERENCED_BY_RELATION tag is set to YES then for each documented # function all documented functions referencing it will be listed. # The default value is: NO. REFERENCED_BY_RELATION = NO # If the REFERENCES_RELATION tag is set to YES then for each documented function # all documented entities called/used by that function will be listed. # The default value is: NO. REFERENCES_RELATION = NO # If the REFERENCES_LINK_SOURCE tag is set to YES and SOURCE_BROWSER tag is set # to YES then the hyperlinks from functions in REFERENCES_RELATION and # REFERENCED_BY_RELATION lists will link to the source code. Otherwise they will # link to the documentation. # The default value is: YES. REFERENCES_LINK_SOURCE = YES # If SOURCE_TOOLTIPS is enabled (the default) then hovering a hyperlink in the # source code will show a tooltip with additional information such as prototype, # brief description and links to the definition and documentation. Since this # will make the HTML file larger and loading of large files a bit slower, you # can opt to disable this feature. # The default value is: YES. # This tag requires that the tag SOURCE_BROWSER is set to YES. 
SOURCE_TOOLTIPS = YES # If the USE_HTAGS tag is set to YES then the references to source code will # point to the HTML generated by the htags(1) tool instead of doxygen built-in # source browser. The htags tool is part of GNU's global source tagging system # (see http://www.gnu.org/software/global/global.html). You will need version # 4.8.6 or higher. # # To use it do the following: # - Install the latest version of global # - Enable SOURCE_BROWSER and USE_HTAGS in the config file # - Make sure the INPUT points to the root of the source tree # - Run doxygen as normal # # Doxygen will invoke htags (and that will in turn invoke gtags), so these # tools must be available from the command line (i.e. in the search path). # # The result: instead of the source browser generated by doxygen, the links to # source code will now point to the output of htags. # The default value is: NO. # This tag requires that the tag SOURCE_BROWSER is set to YES. USE_HTAGS = NO # If the VERBATIM_HEADERS tag is set to YES then doxygen will generate a # verbatim copy of the header file for each class for which an include is # specified. Set to NO to disable this. # See also: Section \class. # The default value is: YES. VERBATIM_HEADERS = YES # If the CLANG_ASSISTED_PARSING tag is set to YES then doxygen will use the # clang parser (see: http://clang.llvm.org/) for more accurate parsing at the # cost of reduced performance. This can be particularly helpful with template # rich C++ code for which doxygen's built-in parser lacks the necessary type # information. # Note: The availability of this option depends on whether or not doxygen was # generated with the -Duse-libclang=ON option for CMake. # The default value is: NO. CLANG_ASSISTED_PARSING = NO # If clang assisted parsing is enabled you can provide the compiler with command # line options that you would normally use when invoking the compiler. 
Note that # the include paths will already be set by doxygen for the files and directories # specified with INPUT and INCLUDE_PATH. # This tag requires that the tag CLANG_ASSISTED_PARSING is set to YES. CLANG_OPTIONS = #--------------------------------------------------------------------------- # Configuration options related to the alphabetical class index #--------------------------------------------------------------------------- # If the ALPHABETICAL_INDEX tag is set to YES, an alphabetical index of all # compounds will be generated. Enable this if the project contains a lot of # classes, structs, unions or interfaces. # The default value is: YES. ALPHABETICAL_INDEX = YES # The COLS_IN_ALPHA_INDEX tag can be used to specify the number of columns in # which the alphabetical index list will be split. # Minimum value: 1, maximum value: 20, default value: 5. # This tag requires that the tag ALPHABETICAL_INDEX is set to YES. COLS_IN_ALPHA_INDEX = 5 # In case all classes in a project start with a common prefix, all classes will # be put under the same header in the alphabetical index. The IGNORE_PREFIX tag # can be used to specify a prefix (or a list of prefixes) that should be ignored # while generating the index headers. # This tag requires that the tag ALPHABETICAL_INDEX is set to YES. IGNORE_PREFIX = #--------------------------------------------------------------------------- # Configuration options related to the HTML output #--------------------------------------------------------------------------- # If the GENERATE_HTML tag is set to YES, doxygen will generate HTML output # The default value is: YES. GENERATE_HTML = YES # The HTML_OUTPUT tag is used to specify where the HTML docs will be put. If a # relative path is entered the value of OUTPUT_DIRECTORY will be put in front of # it. # The default directory is: html. # This tag requires that the tag GENERATE_HTML is set to YES. 
HTML_OUTPUT = html/cpp # The HTML_FILE_EXTENSION tag can be used to specify the file extension for each # generated HTML page (for example: .htm, .php, .asp). # The default value is: .html. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_FILE_EXTENSION = .html # The HTML_HEADER tag can be used to specify a user-defined HTML header file for # each generated HTML page. If the tag is left blank doxygen will generate a # standard header. # # To get valid HTML the header file that includes any scripts and style sheets # that doxygen needs, which is dependent on the configuration options used (e.g. # the setting GENERATE_TREEVIEW). It is highly recommended to start with a # default header using # doxygen -w html new_header.html new_footer.html new_stylesheet.css # YourConfigFile # and then modify the file new_header.html. See also section "Doxygen usage" # for information on how to generate the default header that doxygen normally # uses. # Note: The header is subject to change so you typically have to regenerate the # default header when upgrading to a newer version of doxygen. For a description # of the possible markers and block names see the documentation. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_HEADER = # The HTML_FOOTER tag can be used to specify a user-defined HTML footer for each # generated HTML page. If the tag is left blank doxygen will generate a standard # footer. See HTML_HEADER for more information on how to generate a default # footer and what special commands can be used inside the footer. See also # section "Doxygen usage" for information on how to generate the default footer # that doxygen normally uses. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_FOOTER = # The HTML_STYLESHEET tag can be used to specify a user-defined cascading style # sheet that is used by each HTML page. It can be used to fine-tune the look of # the HTML output. 
If left blank doxygen will generate a default style sheet. # See also section "Doxygen usage" for information on how to generate the style # sheet that doxygen normally uses. # Note: It is recommended to use HTML_EXTRA_STYLESHEET instead of this tag, as # it is more robust and this tag (HTML_STYLESHEET) will in the future become # obsolete. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_STYLESHEET = # The HTML_EXTRA_STYLESHEET tag can be used to specify additional user-defined # cascading style sheets that are included after the standard style sheets # created by doxygen. Using this option one can overrule certain style aspects. # This is preferred over using HTML_STYLESHEET since it does not replace the # standard style sheet and is therefore more robust against future updates. # Doxygen will copy the style sheet files to the output directory. # Note: The order of the extra style sheet files is of importance (e.g. the last # style sheet in the list overrules the setting of the previous ones in the # list). For an example see the documentation. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_EXTRA_STYLESHEET = # The HTML_EXTRA_FILES tag can be used to specify one or more extra images or # other source files which should be copied to the HTML output directory. Note # that these files will be copied to the base HTML output directory. Use the # $relpath^ marker in the HTML_HEADER and/or HTML_FOOTER files to load these # files. In the HTML_STYLESHEET file, use the file name only. Also note that the # files will be copied as-is; there are no commands or markers available. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_EXTRA_FILES = # The HTML_COLORSTYLE_HUE tag controls the color of the HTML output. Doxygen # will adjust the colors in the style sheet and background images according to # this color. Hue is specified as an angle on a colorwheel, see # http://en.wikipedia.org/wiki/Hue for more information. 
For instance the value # 0 represents red, 60 is yellow, 120 is green, 180 is cyan, 240 is blue, 300 # purple, and 360 is red again. # Minimum value: 0, maximum value: 359, default value: 220. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_COLORSTYLE_HUE = 220 # The HTML_COLORSTYLE_SAT tag controls the purity (or saturation) of the colors # in the HTML output. For a value of 0 the output will use grayscales only. A # value of 255 will produce the most vivid colors. # Minimum value: 0, maximum value: 255, default value: 100. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_COLORSTYLE_SAT = 100 # The HTML_COLORSTYLE_GAMMA tag controls the gamma correction applied to the # luminance component of the colors in the HTML output. Values below 100 # gradually make the output lighter, whereas values above 100 make the output # darker. The value divided by 100 is the actual gamma applied, so 80 represents # a gamma of 0.8, The value 220 represents a gamma of 2.2, and 100 does not # change the gamma. # Minimum value: 40, maximum value: 240, default value: 80. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_COLORSTYLE_GAMMA = 80 # If the HTML_TIMESTAMP tag is set to YES then the footer of each generated HTML # page will contain the date and time when the page was generated. Setting this # to YES can help to show when doxygen was last run and thus if the # documentation is up to date. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_TIMESTAMP = NO # If the HTML_DYNAMIC_SECTIONS tag is set to YES then the generated HTML # documentation will contain sections that can be hidden and shown after the # page has loaded. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. 
HTML_DYNAMIC_SECTIONS = NO # With HTML_INDEX_NUM_ENTRIES one can control the preferred number of entries # shown in the various tree structured indices initially; the user can expand # and collapse entries dynamically later on. Doxygen will expand the tree to # such a level that at most the specified number of entries are visible (unless # a fully collapsed tree already exceeds this amount). So setting the number of # entries 1 will produce a full collapsed tree by default. 0 is a special value # representing an infinite number of entries and will result in a full expanded # tree by default. # Minimum value: 0, maximum value: 9999, default value: 100. # This tag requires that the tag GENERATE_HTML is set to YES. HTML_INDEX_NUM_ENTRIES = 100 # If the GENERATE_DOCSET tag is set to YES, additional index files will be # generated that can be used as input for Apple's Xcode 3 integrated development # environment (see: http://developer.apple.com/tools/xcode/), introduced with # OSX 10.5 (Leopard). To create a documentation set, doxygen will generate a # Makefile in the HTML output directory. Running make will produce the docset in # that directory and running make install will install the docset in # ~/Library/Developer/Shared/Documentation/DocSets so that Xcode will find it at # startup. See http://developer.apple.com/tools/creatingdocsetswithdoxygen.html # for more information. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. GENERATE_DOCSET = NO # This tag determines the name of the docset feed. A documentation feed provides # an umbrella under which multiple documentation sets from a single provider # (such as a company or product suite) can be grouped. # The default value is: Doxygen generated docs. # This tag requires that the tag GENERATE_DOCSET is set to YES. DOCSET_FEEDNAME = "Doxygen generated docs" # This tag specifies a string that should uniquely identify the documentation # set bundle. 
This should be a reverse domain-name style string, e.g. # com.mycompany.MyDocSet. Doxygen will append .docset to the name. # The default value is: org.doxygen.Project. # This tag requires that the tag GENERATE_DOCSET is set to YES. DOCSET_BUNDLE_ID = org.doxygen.Project # The DOCSET_PUBLISHER_ID tag specifies a string that should uniquely identify # the documentation publisher. This should be a reverse domain-name style # string, e.g. com.mycompany.MyDocSet.documentation. # The default value is: org.doxygen.Publisher. # This tag requires that the tag GENERATE_DOCSET is set to YES. DOCSET_PUBLISHER_ID = org.doxygen.Publisher # The DOCSET_PUBLISHER_NAME tag identifies the documentation publisher. # The default value is: Publisher. # This tag requires that the tag GENERATE_DOCSET is set to YES. DOCSET_PUBLISHER_NAME = Publisher # If the GENERATE_HTMLHELP tag is set to YES then doxygen generates three # additional HTML index files: index.hhp, index.hhc, and index.hhk. The # index.hhp is a project file that can be read by Microsoft's HTML Help Workshop # (see: http://www.microsoft.com/en-us/download/details.aspx?id=21138) on # Windows. # # The HTML Help Workshop contains a compiler that can convert all HTML output # generated by doxygen into a single compiled HTML file (.chm). Compiled HTML # files are now used as the Windows 98 help format, and will replace the old # Windows help format (.hlp) on all Windows platforms in the future. Compressed # HTML files also contain an index, a table of contents, and you can search for # words in the documentation. The HTML workshop also contains a viewer for # compressed HTML files. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. GENERATE_HTMLHELP = NO # The CHM_FILE tag can be used to specify the file name of the resulting .chm # file. You can add a path in front of the file if the result should not be # written to the html output directory. 
# This tag requires that the tag GENERATE_HTMLHELP is set to YES. CHM_FILE = # The HHC_LOCATION tag can be used to specify the location (absolute path # including file name) of the HTML help compiler (hhc.exe). If non-empty, # doxygen will try to run the HTML help compiler on the generated index.hhp. # The file has to be specified with full path. # This tag requires that the tag GENERATE_HTMLHELP is set to YES. HHC_LOCATION = # The GENERATE_CHI flag controls if a separate .chi index file is generated # (YES) or that it should be included in the master .chm file (NO). # The default value is: NO. # This tag requires that the tag GENERATE_HTMLHELP is set to YES. GENERATE_CHI = NO # The CHM_INDEX_ENCODING is used to encode HtmlHelp index (hhk), content (hhc) # and project file content. # This tag requires that the tag GENERATE_HTMLHELP is set to YES. CHM_INDEX_ENCODING = # The BINARY_TOC flag controls whether a binary table of contents is generated # (YES) or a normal table of contents (NO) in the .chm file. Furthermore it # enables the Previous and Next buttons. # The default value is: NO. # This tag requires that the tag GENERATE_HTMLHELP is set to YES. BINARY_TOC = NO # The TOC_EXPAND flag can be set to YES to add extra items for group members to # the table of contents of the HTML help documentation and to the tree view. # The default value is: NO. # This tag requires that the tag GENERATE_HTMLHELP is set to YES. TOC_EXPAND = NO # If the GENERATE_QHP tag is set to YES and both QHP_NAMESPACE and # QHP_VIRTUAL_FOLDER are set, an additional index file will be generated that # can be used as input for Qt's qhelpgenerator to generate a Qt Compressed Help # (.qch) of the generated HTML documentation. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. GENERATE_QHP = NO # If the QHG_LOCATION tag is specified, the QCH_FILE tag can be used to specify # the file name of the resulting .qch file. 
The path specified is relative to # the HTML output folder. # This tag requires that the tag GENERATE_QHP is set to YES. QCH_FILE = # The QHP_NAMESPACE tag specifies the namespace to use when generating Qt Help # Project output. For more information please see Qt Help Project / Namespace # (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#namespace). # The default value is: org.doxygen.Project. # This tag requires that the tag GENERATE_QHP is set to YES. QHP_NAMESPACE = org.doxygen.Project # The QHP_VIRTUAL_FOLDER tag specifies the namespace to use when generating Qt # Help Project output. For more information please see Qt Help Project / Virtual # Folders (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#virtual- # folders). # The default value is: doc. # This tag requires that the tag GENERATE_QHP is set to YES. QHP_VIRTUAL_FOLDER = doc # If the QHP_CUST_FILTER_NAME tag is set, it specifies the name of a custom # filter to add. For more information please see Qt Help Project / Custom # Filters (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#custom- # filters). # This tag requires that the tag GENERATE_QHP is set to YES. QHP_CUST_FILTER_NAME = # The QHP_CUST_FILTER_ATTRS tag specifies the list of the attributes of the # custom filter to add. For more information please see Qt Help Project / Custom # Filters (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#custom- # filters). # This tag requires that the tag GENERATE_QHP is set to YES. QHP_CUST_FILTER_ATTRS = # The QHP_SECT_FILTER_ATTRS tag specifies the list of the attributes this # project's filter section matches. Qt Help Project / Filter Attributes (see: # http://qt-project.org/doc/qt-4.8/qthelpproject.html#filter-attributes). # This tag requires that the tag GENERATE_QHP is set to YES. QHP_SECT_FILTER_ATTRS = # The QHG_LOCATION tag can be used to specify the location of Qt's # qhelpgenerator. If non-empty doxygen will try to run qhelpgenerator on the # generated .qhp file. 
# This tag requires that the tag GENERATE_QHP is set to YES. QHG_LOCATION = # If the GENERATE_ECLIPSEHELP tag is set to YES, additional index files will be # generated, together with the HTML files, they form an Eclipse help plugin. To # install this plugin and make it available under the help contents menu in # Eclipse, the contents of the directory containing the HTML and XML files needs # to be copied into the plugins directory of eclipse. The name of the directory # within the plugins directory should be the same as the ECLIPSE_DOC_ID value. # After copying Eclipse needs to be restarted before the help appears. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. GENERATE_ECLIPSEHELP = NO # A unique identifier for the Eclipse help plugin. When installing the plugin # the directory name containing the HTML and XML files should also have this # name. Each documentation set should have its own identifier. # The default value is: org.doxygen.Project. # This tag requires that the tag GENERATE_ECLIPSEHELP is set to YES. ECLIPSE_DOC_ID = org.doxygen.Project # If you want full control over the layout of the generated HTML pages it might # be necessary to disable the index and replace it with your own. The # DISABLE_INDEX tag can be used to turn on/off the condensed index (tabs) at top # of each HTML page. A value of NO enables the index and the value YES disables # it. Since the tabs in the index contain the same information as the navigation # tree, you can set this option to YES if you also set GENERATE_TREEVIEW to YES. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. DISABLE_INDEX = NO # The GENERATE_TREEVIEW tag is used to specify whether a tree-like index # structure should be generated to display hierarchical information. If the tag # value is set to YES, a side panel will be generated containing a tree-like # index structure (just like the one that is generated for HTML Help). 
For this # to work a browser that supports JavaScript, DHTML, CSS and frames is required # (i.e. any modern browser). Windows users are probably better off using the # HTML help feature. Via custom style sheets (see HTML_EXTRA_STYLESHEET) one can # further fine-tune the look of the index. As an example, the default style # sheet generated by doxygen has an example that shows how to put an image at # the root of the tree instead of the PROJECT_NAME. Since the tree basically has # the same information as the tab index, you could consider setting # DISABLE_INDEX to YES when enabling this option. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. GENERATE_TREEVIEW = NO # The ENUM_VALUES_PER_LINE tag can be used to set the number of enum values that # doxygen will group on one line in the generated HTML documentation. # # Note that a value of 0 will completely suppress the enum values from appearing # in the overview section. # Minimum value: 0, maximum value: 20, default value: 4. # This tag requires that the tag GENERATE_HTML is set to YES. ENUM_VALUES_PER_LINE = 4 # If the treeview is enabled (see GENERATE_TREEVIEW) then this tag can be used # to set the initial width (in pixels) of the frame in which the tree is shown. # Minimum value: 0, maximum value: 1500, default value: 250. # This tag requires that the tag GENERATE_HTML is set to YES. TREEVIEW_WIDTH = 250 # If the EXT_LINKS_IN_WINDOW option is set to YES, doxygen will open links to # external symbols imported via tag files in a separate window. # The default value is: NO. # This tag requires that the tag GENERATE_HTML is set to YES. EXT_LINKS_IN_WINDOW = NO # Use this tag to change the font size of LaTeX formulas included as images in # the HTML documentation. When you change the font size after a successful # doxygen run you need to manually remove any form_*.png images from the HTML # output directory to force them to be regenerated. 
# Minimum value: 8, maximum value: 50, default value: 10. # This tag requires that the tag GENERATE_HTML is set to YES. FORMULA_FONTSIZE = 10 # Use the FORMULA_TRANSPARENT tag to determine whether or not the images # generated for formulas are transparent PNGs. Transparent PNGs are not # supported properly for IE 6.0, but are supported on all modern browsers. # # Note that when changing this option you need to delete any form_*.png files in # the HTML output directory before the changes have effect. # The default value is: YES. # This tag requires that the tag GENERATE_HTML is set to YES. FORMULA_TRANSPARENT = YES # Enable the USE_MATHJAX option to render LaTeX formulas using MathJax (see # http://www.mathjax.org) which uses client side Javascript for the rendering # instead of using pre-rendered bitmaps. Use this if you do not have LaTeX # installed or if you want the formulas to look prettier in the HTML output. When # enabled you may also need to install MathJax separately and configure the path # to it using the MATHJAX_RELPATH option. # The default value is: NO. # This tag requires that the tag USE_MATHJAX is set to YES. USE_MATHJAX = NO # When MathJax is enabled you can set the default output format to be used for # the MathJax output. See the MathJax site (see: # http://docs.mathjax.org/en/latest/output.html) for more details. # Possible values are: HTML-CSS (which is slower, but has the best # compatibility), NativeMML (i.e. MathML) and SVG. # The default value is: HTML-CSS. # This tag requires that the tag USE_MATHJAX is set to YES. MATHJAX_FORMAT = HTML-CSS # When MathJax is enabled you need to specify the location relative to the HTML # output directory using the MATHJAX_RELPATH option. The destination directory # should contain the MathJax.js script. For instance, if the mathjax directory # is located at the same level as the HTML output directory, then # MATHJAX_RELPATH should be ../mathjax. 
The default value points to the MathJax # Content Delivery Network so you can quickly see the result without installing # MathJax. However, it is strongly recommended to install a local copy of # MathJax from http://www.mathjax.org before deployment. # The default value is: http://cdn.mathjax.org/mathjax/latest. # This tag requires that the tag USE_MATHJAX is set to YES. MATHJAX_RELPATH = http://cdn.mathjax.org/mathjax/latest # The MATHJAX_EXTENSIONS tag can be used to specify one or more MathJax # extension names that should be enabled during MathJax rendering. For example # MATHJAX_EXTENSIONS = TeX/AMSmath TeX/AMSsymbols # This tag requires that the tag USE_MATHJAX is set to YES. MATHJAX_EXTENSIONS = # The MATHJAX_CODEFILE tag can be used to specify a file with javascript pieces # of code that will be used on startup of the MathJax code. See the MathJax site # (see: http://docs.mathjax.org/en/latest/output.html) for more details. For an # example see the documentation. # This tag requires that the tag USE_MATHJAX is set to YES. MATHJAX_CODEFILE = # When the SEARCHENGINE tag is enabled doxygen will generate a search box for # the HTML output. The underlying search engine uses javascript and DHTML and # should work on any modern browser. Note that when using HTML help # (GENERATE_HTMLHELP), Qt help (GENERATE_QHP), or docsets (GENERATE_DOCSET) # there is already a search function so this one should typically be disabled. # For large projects the javascript based search engine can be slow, then # enabling SERVER_BASED_SEARCH may provide a better solution. It is possible to # search using the keyboard; to jump to the search box use <access key> + S # (what the <access key> is depends on the OS and browser, but it is typically # <CTRL>, <ALT>/