Repository: nanoporetech/pod5-file-format
Branch: master
Commit: 6356e5c97b36
Files: 297
Total size: 2.3 MB

Directory structure:
gitextract_n9lck0re/

├── .clang-format
├── .codespellrc
├── .flake8
├── .gitattributes
├── .github/
│   └── ISSUE_TEMPLATE/
│       └── bug_report.md
├── .gitignore
├── .gitlab-ci.yml
├── .gitmodules
├── .pre-commit-config.yaml
├── .readthedocs.yaml
├── CHANGELOG.md
├── CMakeLists.txt
├── CMakePresets.json
├── DEV.md
├── LICENSE.md
├── README.md
├── benchmarks/
│   ├── .gitignore
│   ├── README.md
│   ├── build.sh
│   ├── convert/
│   │   ├── run_blow5.sh
│   │   └── run_pod5.sh
│   ├── find_all_read_ids/
│   │   ├── run_blow5.sh
│   │   ├── run_fast5.sh
│   │   └── run_pod5.sh
│   ├── find_all_samples/
│   │   ├── run_blow5.sh
│   │   ├── run_fast5.sh
│   │   └── run_pod5.sh
│   ├── find_selected_read_ids_read_number/
│   │   ├── run_blow5.sh
│   │   ├── run_fast5.sh
│   │   └── run_pod5.sh
│   ├── find_selected_read_ids_sample_count/
│   │   ├── run_blow5.sh
│   │   ├── run_fast5.sh
│   │   └── run_pod5.sh
│   ├── find_selected_read_ids_samples/
│   │   ├── run_blow5.sh
│   │   ├── run_fast5.sh
│   │   └── run_pod5.sh
│   ├── image/
│   │   ├── Dockerfile.base
│   │   ├── install_slow5.sh
│   │   └── requirements-benchmarks.txt
│   ├── run_benchmarks.py
│   ├── run_benchmarks_in_docker.sh
│   └── tools/
│       ├── check_csvs_consistent.py
│       ├── fast5_to_single_blow5.sh
│       ├── find_and_get_fast5.py
│       ├── find_and_get_pod5.py
│       ├── pyslow5_tests.py
│       ├── run_benchmarks_docker_entry.sh
│       └── select-random-ids.py
├── c++/
│   ├── CMakeLists.txt
│   ├── examples/
│   │   ├── CMakeLists.txt
│   │   ├── README.md
│   │   ├── find_all_read_data.cpp
│   │   ├── find_all_read_ids.cpp
│   │   ├── find_specific_read_ids.cpp
│   │   └── find_specific_read_ids_with_signal.cpp
│   ├── pod5_format/
│   │   ├── async_signal_loader.cpp
│   │   ├── async_signal_loader.h
│   │   ├── c_api.cpp
│   │   ├── c_api.h
│   │   ├── dictionary_writer.h
│   │   ├── expandable_buffer.h
│   │   ├── file_output_stream.h
│   │   ├── file_reader.cpp
│   │   ├── file_reader.h
│   │   ├── file_recovery.h
│   │   ├── file_updater.cpp
│   │   ├── file_updater.h
│   │   ├── file_writer.cpp
│   │   ├── file_writer.h
│   │   ├── flatbuffers/
│   │   │   └── footer.fbs
│   │   ├── internal/
│   │   │   ├── async_output_stream.h
│   │   │   ├── combined_file_utils.h
│   │   │   ├── linux_output_stream.h
│   │   │   └── tracing/
│   │   │       └── tracing.h
│   │   ├── io_manager.cpp
│   │   ├── io_manager.h
│   │   ├── memory_pool.cpp
│   │   ├── memory_pool.h
│   │   ├── migration/
│   │   │   ├── migration.cpp
│   │   │   ├── migration.h
│   │   │   ├── migration_utils.h
│   │   │   ├── v0_to_v1.cpp
│   │   │   ├── v1_to_v2.cpp
│   │   │   ├── v2_to_v3.cpp
│   │   │   └── v3_to_v4.cpp
│   │   ├── read_table_reader.cpp
│   │   ├── read_table_reader.h
│   │   ├── read_table_schema.cpp
│   │   ├── read_table_schema.h
│   │   ├── read_table_utils.cpp
│   │   ├── read_table_utils.h
│   │   ├── read_table_writer.cpp
│   │   ├── read_table_writer.h
│   │   ├── read_table_writer_utils.cpp
│   │   ├── read_table_writer_utils.h
│   │   ├── result.h
│   │   ├── run_info_table_reader.cpp
│   │   ├── run_info_table_reader.h
│   │   ├── run_info_table_schema.cpp
│   │   ├── run_info_table_schema.h
│   │   ├── run_info_table_writer.cpp
│   │   ├── run_info_table_writer.h
│   │   ├── schema_field_builder.h
│   │   ├── schema_metadata.cpp
│   │   ├── schema_metadata.h
│   │   ├── schema_utils.cpp
│   │   ├── schema_utils.h
│   │   ├── signal_builder.h
│   │   ├── signal_compression.cpp
│   │   ├── signal_compression.h
│   │   ├── signal_table_reader.cpp
│   │   ├── signal_table_reader.h
│   │   ├── signal_table_schema.cpp
│   │   ├── signal_table_schema.h
│   │   ├── signal_table_utils.h
│   │   ├── signal_table_writer.cpp
│   │   ├── signal_table_writer.h
│   │   ├── svb16/
│   │   │   ├── common.hpp
│   │   │   ├── decode.hpp
│   │   │   ├── decode_scalar.hpp
│   │   │   ├── decode_x64.hpp
│   │   │   ├── encode.hpp
│   │   │   ├── encode_scalar.hpp
│   │   │   ├── encode_x64.hpp
│   │   │   ├── generate_shuffle_tables.py
│   │   │   ├── intrinsics.hpp
│   │   │   ├── shuffle_tables.hpp
│   │   │   ├── simd_detect_x64.hpp
│   │   │   ├── streamvbytedelta_decode_16.c
│   │   │   ├── streamvbytedelta_encode_16.c
│   │   │   ├── streamvbytedelta_x64_decode_16.c
│   │   │   ├── streamvbytedelta_x64_encode_16.c
│   │   │   ├── svb16.c
│   │   │   └── svb16.h
│   │   ├── table_reader.cpp
│   │   ├── table_reader.h
│   │   ├── thread_pool.cpp
│   │   ├── thread_pool.h
│   │   ├── tuple_utils.h
│   │   ├── types.cpp
│   │   ├── types.h
│   │   ├── uuid.h
│   │   └── version.h.in
│   ├── pod5_format_pybind/
│   │   ├── CMakeLists.txt
│   │   ├── _version.py.in
│   │   ├── api.h
│   │   ├── bindings.cpp
│   │   ├── build_wheel.cmake
│   │   ├── repack/
│   │   │   ├── repack_functions.h
│   │   │   ├── repack_output.cpp
│   │   │   ├── repack_output.h
│   │   │   ├── repack_states.h
│   │   │   ├── repack_utils.h
│   │   │   ├── repacker.cpp
│   │   │   └── repacker.h
│   │   ├── subset.cpp
│   │   ├── subset.h
│   │   └── utils.h
│   └── test/
│       ├── CMakeLists.txt
│       ├── TemporaryDirectory.h
│       ├── c_api_build_test.c
│       ├── c_api_null_input.cpp
│       ├── c_api_test_utils.h
│       ├── c_api_tests.cpp
│       ├── file_reader_writer_tests.cpp
│       ├── main.cpp
│       ├── output_stream_tests.cpp
│       ├── read_table_tests.cpp
│       ├── read_table_writer_utils_tests.cpp
│       ├── run_info_table_tests.cpp
│       ├── schema_tests.cpp
│       ├── signal_compression_tests.cpp
│       ├── signal_table_tests.cpp
│       ├── svb16_scalar_tests.cpp
│       ├── svb16_x64_tests.cpp
│       ├── test_utils.h
│       ├── thread_pool_tests.cpp
│       ├── utils.h
│       └── uuid_tests.cpp
├── ci/
│   ├── docker/
│   │   ├── Dockerfile.conda
│   │   ├── Dockerfile.py39.arm64
│   │   └── Dockerfile.py39.x64
│   ├── generate_coverage_report.sh
│   ├── get_tag_version.cmake
│   ├── gitlab-ci-common.yml
│   ├── install.sh
│   ├── package.sh
│   └── unpack_libs_for_python.sh
├── cmake/
│   ├── BuildFlatBuffers.cmake
│   ├── Findzstd.cmake
│   ├── conan_provider.cmake
│   ├── pod5_fuzz.cmake
│   ├── pod5_packaging.cmake
│   └── presets/
│       ├── conan-build-options.json
│       ├── conan-profiles.json
│       └── conan-provider.json
├── conanfile.py
├── docs/
│   ├── DESIGN.md
│   ├── README.md
│   ├── SPECIFICATION.md
│   └── tables/
│       ├── reads.toml
│       ├── run_info.toml
│       └── signal.toml
├── fuzz/
│   ├── .gitattributes
│   ├── CMakeLists.txt
│   ├── fuzz_compress.cpp
│   ├── fuzz_file.cpp
│   └── runner.cpp
├── pod5_make_version.py
├── pyproject.toml
├── pytest.ini
├── python/
│   ├── .gitignore
│   ├── lib_pod5/
│   │   ├── Makefile
│   │   ├── README.md
│   │   ├── pyproject.toml
│   │   ├── setup.py
│   │   └── src/
│   │       ├── lib_pod5/
│   │       │   ├── __init__.py
│   │       │   ├── pod5_format_pybind.pyi
│   │       │   └── py.typed
│   │       └── test/
│   │           └── test_lib_pod5.py
│   └── pod5/
│       ├── Makefile
│       ├── README.md
│       ├── examples/
│       │   ├── find_all_reads.py
│       │   └── find_specific_reads.py
│       ├── pyproject.toml
│       ├── setup.py
│       ├── src/
│       │   ├── pod5/
│       │   │   ├── __init__.py
│       │   │   ├── api_utils.py
│       │   │   ├── dataset.py
│       │   │   ├── pod5_types.py
│       │   │   ├── reader.py
│       │   │   ├── repack.py
│       │   │   ├── signal_tools.py
│       │   │   ├── tools/
│       │   │   │   ├── __init__.py
│       │   │   │   ├── main.py
│       │   │   │   ├── parsers.py
│       │   │   │   ├── pod5_convert_from_fast5.py
│       │   │   │   ├── pod5_convert_to_fast5.py
│       │   │   │   ├── pod5_filter.py
│       │   │   │   ├── pod5_inspect.py
│       │   │   │   ├── pod5_merge.py
│       │   │   │   ├── pod5_recover.py
│       │   │   │   ├── pod5_repack.py
│       │   │   │   ├── pod5_subset.py
│       │   │   │   ├── pod5_update.py
│       │   │   │   ├── pod5_view.py
│       │   │   │   ├── polars_utils.py
│       │   │   │   └── utils.py
│       │   │   └── writer.py
│       │   └── tests/
│       │       ├── __init__.py
│       │       ├── conftest.py
│       │       ├── test_api.py
│       │       ├── test_convert_from_fast5.py
│       │       ├── test_convert_to_fast5.py
│       │       ├── test_dataset.py
│       │       ├── test_filter.py
│       │       ├── test_inspect.py
│       │       ├── test_merge.py
│       │       ├── test_reader.py
│       │       ├── test_recover.py
│       │       ├── test_repack.py
│       │       ├── test_signal_tools.py
│       │       ├── test_subset.py
│       │       ├── test_tools.py
│       │       ├── test_update.py
│       │       ├── test_view.py
│       │       └── test_writer.py
│       └── test_utils/
│           └── check_pod5_files_equal.py
├── test_data/
│   ├── multi_fast5_zip.fast5
│   ├── multi_fast5_zip_v0.pod5
│   ├── multi_fast5_zip_v1.pod5
│   ├── multi_fast5_zip_v2.pod5
│   ├── multi_fast5_zip_v3.pod5
│   ├── multi_fast5_zip_v4.pod5
│   ├── single_read_fast5/
│   │   └── fe85b517-62ee-4a33-8767-41cab5d5ab39.fast5.single-read
│   ├── split_1_v4.pod5
│   ├── split_2_v4.pod5
│   └── subset_mapping_examples/
│       ├── read_ids.txt
│       ├── subset.csv
│       └── subset.summary
├── test_package/
│   ├── CMakeLists.txt
│   ├── conanfile.py
│   ├── test_cpp_api.cpp
│   └── test_package.cpp
└── third_party/
    ├── build_instructions.txt
    ├── gsl-disable-gsl-suppress.patch
    ├── include/
    │   ├── .editorconfig
    │   ├── catch2/
    │   │   └── catch.hpp
    │   ├── gsl/
    │   │   ├── gsl
    │   │   ├── gsl-lite-vc6.hpp
    │   │   ├── gsl-lite.h
    │   │   └── gsl-lite.hpp
    │   └── gsl.h
    ├── jsoncons-0.166-icc-fix.patch
    ├── licenses/
    │   ├── catch2.txt
    │   └── gsl-lite.txt
    └── software_versions.yaml

================================================
FILE CONTENTS
================================================

================================================
FILE: .clang-format
================================================
---
# See https://releases.llvm.org/14.0.0/tools/clang/docs/ClangFormatStyleOptions.html
BasedOnStyle: Chromium
AccessModifierOffset: -4
AlignAfterOpenBracket: AlwaysBreak
# AlignArrayOfStructures can cause crashes, see https://github.com/llvm/llvm-project/issues/55269
#AlignArrayOfStructures: Left
AllowAllParametersOfDeclarationOnNextLine: false
AllowShortBlocksOnASingleLine: Empty
AllowShortFunctionsOnASingleLine: All
BinPackArguments: false
BinPackParameters: false
BreakBeforeBinaryOperators: NonAssignment
BreakBeforeBraces: Custom
BraceWrapping:
  # NB: due to https://github.com/llvm/llvm-project/issues/55582 the MultiLine setting will not
  # always work. This should be fixed in clang-format 15, but that is not yet available as a
  # python wheel (see https://github.com/ssciwr/clang-format-wheel/issues/49).
  AfterControlStatement: MultiLine # makes sure multiline ifs don't run into their bodies
  AfterFunction: true # makes constructors with initialisers much nicer
BreakBeforeConceptDeclarations: true
BreakBeforeTernaryOperators: true
BreakConstructorInitializers: BeforeComma
BreakStringLiterals: true
ColumnLimit: 100
CompactNamespaces: true
ConstructorInitializerIndentWidth: 0
ContinuationIndentWidth: 4
Cpp11BracedListStyle: true
DerivePointerAlignment: false # force use of the PointerAlignment setting
FixNamespaceComments: true
# Merge all #include blocks, then split them into groups by the category priorities below.
IncludeBlocks: Regroup
IncludeCategories:
  # Aim is:
  # 0. the "main" header file (#include "foo.h" in foo.cpp) automatically gets priority 0
  # 1. internal headers (#include "util/helpers.h"): quotation marks, with a '/'
  # 2. third-party headers (#include <arrow/status.h>): angle brackets, '/' or .h/.hpp/.h++
  #    file ext
  # 3. standard library headers (#include <vector>): angle brackets, no file ext, no '/'
  - Regex:    '^"'
    Priority: 1
  - Regex:    '^<.*/'
    Priority: 2
  - Regex:    '\.h>'
    Priority: 2
  - Regex:    '\.hpp>'
    Priority: 2
  - Regex:    '\.h\+\+>'
    Priority: 2
IncludeIsMainRegex: '(_test|_tests|Tests|Test)?$'
  # foo.h will be considered the "main" header (and sorted to the top) for all of the following:
  # - foo.cpp
  # - foo_test.cpp
  # - foo_tests.cpp
  # - fooTests.cpp (although this is intended for Foo.h and FooTests.cpp)
  # - fooTest.cpp (although this is intended for Foo.h and FooTest.cpp)
IndentCaseLabels: false
IndentWidth: 4
InsertBraces: true
PackConstructorInitializers: CurrentLine
PointerAlignment: Middle
QualifierAlignment: Right # const east
# clang 14 *should* know about QualifierOrder (according to its docs) but claims it doesn't
#QualifierOrder: ['static', 'constexpr', 'inline', 'type', 'const', 'volatile', 'restrict']
ReflowComments: false
SeparateDefinitionBlocks: Always
SortIncludes: CaseInsensitive
SortUsingDeclarations: true
SpaceAroundPointerQualifiers: Before
Standard: c++20


================================================
FILE: .codespellrc
================================================
# Waiting for pyproject.toml support: https://github.com/codespell-project/codespell/issues/2055

[codespell]
# "write-changes" doesn't work with "ignore-regex"
# https://github.com/codespell-project/codespell/issues/2056
# comma-separated list of built-in dictionaries (default is "clear,rare")
builtin = clear,rare,code
# show the line in which the error occurred
context = 0
# these options are turned on by specifying them here
check-filenames =
check-hidden =
enable-colors =
# split words on underscores
# e.g. "foo_bar" is split into two words ("foo", "bar") instead of one word ("foo_bar")
ignore-regex = _
# comma-separated list of false positives
ignore-words-list = iff,inout,befores,deque,stdio,O_WRONLY,wronly,sv_lite,lite,creat,arange
# comma-separated list of globs of files not to check
skip = .gitignore,.codespellrc


================================================
FILE: .flake8
================================================
# Waiting for pyproject.toml support: https://gitlab.com/pycqa/flake8/-/issues/428

[flake8]
extend-ignore = E203, W503
max-line-length = 120
per-file-ignores = __init__.py:F401, __init__.py:F403


================================================
FILE: .gitattributes
================================================
# Based on https://github.com/alexkaratarakis/gitattributes
# Auto detect text files and force linux-style line endings
*     text=auto eol=lf
# Documents
*.bibtex   text diff=bibtex
*.doc      diff=astextplain
*.DOC      diff=astextplain
*.docx     diff=astextplain
*.DOCX     diff=astextplain
*.dot      diff=astextplain
*.DOT      diff=astextplain
*.pdf      diff=astextplain
*.PDF      diff=astextplain
*.rtf      diff=astextplain
*.RTF      diff=astextplain
*.md       text diff=markdown
*.mdx      text diff=markdown
*.tex      text diff=tex
*.adoc     text
*.textile  text
*.mustache text
*.csv      text
*.tab      text
*.tsv      text
*.txt      text
*.sql      text
*.epub     diff=astextplain
# Graphics
*.png      binary
*.jpg      binary
*.jpeg     binary
*.gif      binary
*.tif      binary
*.tiff     binary
*.ico      binary
*.svg      binary
*.eps      binary
# Scripts
*.bash     text
*.fish     text
*.sh       text
*.zsh      text
# These are explicitly windows files and should use crlf
*.bat      text eol=crlf
*.cmd      text eol=crlf
*.ps1      text eol=crlf
# Serialisation
*.json     text
*.toml     text
*.xml      text
*.yaml     text
*.yml      text
# Archives
*.7z       binary
*.gz       binary
*.tar      binary
*.tgz      binary
*.zip      binary
# Text files where line endings should be preserved
*.diff     -text
*.patch    -text
# Exclude git(lab)-specific files when making an archive of the source tree
.gitattributes          export-ignore
.gitignore              export-ignore
.gitkeep                export-ignore
.git-blame-ignore-revs  export-ignore
.gitlab-ci.yml          export-ignore
/ci                     export-ignore
# C++ Sources
*.c        text diff=cpp
*.cc       text diff=cpp
*.cxx      text diff=cpp
*.cpp      text diff=cpp
*.c++      text diff=cpp
*.hpp      text diff=cpp
*.h        text diff=cpp
*.h++      text diff=cpp
*.hh       text diff=cpp
# Read formats
*.pod5 filter=lfs diff=lfs merge=lfs -text
*.fast5    binary


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.md
================================================
---
name: Bug report
about: Create a report to help us improve
title: ''
labels: ''
assignees: ''

---

## Issue Description

> Please provide a description of your issue and include any commands used to reproduce the issue.

## Logs

> Please provide any log files. These can be generated by setting the `POD5_DEBUG` environment variable e.g. `POD5_DEBUG=1 pod5 view my.pod5`

## Specifications

- Pod5 Version:
- Python Version:
- Platform:


================================================
FILE: .gitignore
================================================
build*/
.conan/
cmake-build*/
CMakeUserPresets.json
_build/
.cache/
dist/
.DS_Store
.pod5
venv/
*.venv/
uv.lock
docs/public/
.tmp_pod5*
_version.py
*egg-info/
POD5Version.cmake
*.swp
test_package/CMakeUserPresets.json
.vscode/
.devcontainer/
__pycache__
python/Python.framework/
/fuzz/corpus_*


================================================
FILE: .gitlab-ci.yml
================================================
# Pipeline stages, listed in execution order.
stages:
  - .pre
  - build
  - test
  - build-conan
  - archive
  - deploy

# Pull in additional CI configuration from a file inside this repository.
include:
  - local: '/ci/gitlab-ci-common.yml'

# Pipeline-wide variables, available to every job unless the job overrides them.
variables:
  # Have the runner check out git submodules, including nested ones.
  GIT_SUBMODULE_STRATEGY: recursive
  STABLE_BRANCH_NAME: master
  DO_UPLOAD: "yes" # Always upload in conan upload jobs (only run on tags)
  CONAN_PROFILE_BUILD_TYPE: Release
  # Python version used for the `.venv_conan` virtualenv created by the macOS and Windows builds.
  CONAN_VENV_PYTHON: "3.13"
  # cmake release pip-installed by the jobs that reference ${CMAKE_VERSION}.
  CMAKE_VERSION: "4.2.3"
# Default before_script: a single empty command, i.e. no setup. A job that declares its own
# before_script replaces this default.
before_script:
  - ""

# The Python versions that we build and test. Jobs extend this hidden template to run once per
# version through a parallel matrix that sets PYTHON_VERSION.
# The versions are quoted so that "3.10" stays a string instead of being read as the float 3.1.
.parallel-py-versions:
  parallel:
    matrix:
      - PYTHON_VERSION: ["3.10", "3.11", "3.12", "3.13", "3.14"]


# ======================================
#
#     Docker
#
# ======================================


# Hidden template: builds one CI docker image and pushes it to ${CI_REGISTRY_IMAGE}/${IMAGE_TAG}.
# Only runs when triggered manually. Extending jobs supply IMAGE_TAG and DOCKERFILE.
# NOTE(review): the build passes --target "${PLATFORM}", but none of the jobs visible in this
# file set PLATFORM — confirm where that value is expected to come from.
.build-docker-image:
  stage: .pre
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-docker:latest
  before_script:
    # Log in so that the push in `script` is authorised.
    - docker login --username ${CI_REGISTRY_USER} --password ${CI_REGISTRY_PASSWORD} ${CI_REGISTRY}
  when: manual
  # Retry up to twice, but only when the runner itself failed.
  retry:
    max: 2
    when: runner_system_failure
  script:
    - tag="${CI_REGISTRY_IMAGE}/${IMAGE_TAG}"
    # The build context is ci/docker; --pull refreshes the base image before building.
    - docker image build --pull --target "${PLATFORM}"
                         --tag "${tag}" --file ${DOCKERFILE} ci/docker
    - docker image push ${tag}

# Builds the "build-arm64" image from ci/docker/Dockerfile.py39.arm64 on an ARM docker builder.
docker base aarch64:
  extends:
    - .build-docker-image
  tags:
    - docker-builder-arm
  variables:
    DOCKERFILE: "ci/docker/Dockerfile.py39.arm64"
    IMAGE_TAG: "build-arm64"

# Builds the "build-x64" image from ci/docker/Dockerfile.py39.x64 on a docker builder.
docker base x86-64:
  extends:
    - .build-docker-image
  tags:
    - docker-builder
  variables:
    DOCKERFILE: "ci/docker/Dockerfile.py39.x64"
    IMAGE_TAG: "build-x64"

# Builds the "conda" image from ci/docker/Dockerfile.conda on a docker builder.
docker conda:
  extends:
    - .build-docker-image
  tags:
    - docker-builder
  variables:
    DOCKERFILE: "ci/docker/Dockerfile.conda"
    IMAGE_TAG: "conda"


# Hidden template for jobs that need to be logged in to the CI container registry.
# A job's stage must be one of those declared under `stages:`. `docker` is not declared there, so
# a job inheriting it would be rejected; use `.pre`, the stage the docker image builds run in.
# Jobs that set their own `stage` are unaffected.
.docker template:
  stage: .pre
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-docker:latest
  before_script:
    - docker login --username ${CI_REGISTRY_USER} --password ${CI_REGISTRY_PASSWORD} ${CI_REGISTRY}
  # Retry up to twice, but only when the runner itself failed.
  retry:
    max: 2
    when: runner_system_failure

# ======================================
#
#     Versioning
#
# ======================================

# Computes the package version with setuptools_scm, generates the derived version files with
# pod5_make_version, and publishes them as artifacts for the jobs that `needs` this one.
prepare_version:
  stage: .pre
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:3.10
  script:
    # Delete local tags whose names contain a, b, r, c or dev before the version is computed
    # (presumably to drop pre-release tags such as alpha/beta/rc/dev — confirm).
    - git tag -d $(git tag -l "*a*")
    - git tag -d $(git tag -l "*b*")
    - git tag -d $(git tag -l "*r*")
    - git tag -d $(git tag -l "*c*")
    - git tag -d $(git tag -l "*dev*")
    # On a tag pipeline, make sure a tag without the leading "v" exists locally.
    - if [[ ${CI_COMMIT_TAG/#v/} && -z $( git tag -l "${CI_COMMIT_TAG/#v/}" ) ]]; then git tag ${CI_COMMIT_TAG/#v/}; fi
    - pip install --upgrade pip setuptools_scm~=7.1
    - apt update && apt install -y git-lfs
    # Print any uncommitted changes in the work tree to the job log.
    - git status --porcelain
    - python -m setuptools_scm
    - cat _version.py
    # Show the version that will be used in the pod5/pyproject.toml
    # (the value from _version.py with any "+local" suffix cut off).
    - VERSION=$(grep "__version__" _version.py | awk '{print $5}' | tr -d "'" | cut -d'+' -f1)
    - echo $VERSION
    - python -m pod5_make_version
    # Print the generated files so that they can be inspected in the job log.
    - cat cmake/POD5Version.cmake
    - cat _version.py python/lib_pod5/src/lib_pod5/_version.py
    - cat _version.py python/pod5/src/pod5/_version.py
  artifacts:
    name: "${CI_JOB_NAME}-artifacts"
    paths:
      - "cmake/POD5Version.cmake"
      - "_version.py"
      - "python/lib_pod5/src/lib_pod5/_version.py"
      - "python/pod5/src/pod5/_version.py"


# ======================================
#
#     Pre-Flight Setup / Checks
#
# ======================================

# Tag pipelines only: fails when the version printed by ci/get_tag_version.cmake differs from the
# tag name with its leading "v" removed.
tag_version_check:
  stage: .pre
  needs:
    - "prepare_version"
  only:
    - tags
  image: ${CI_REGISTRY}/minknow/images/build-x86_64-gcc13:latest
  script:
    # Install the pinned cmake into a throwaway virtualenv.
    - uv venv .venv
    - source .venv/bin/activate
    - uv pip install "cmake==${CMAKE_VERSION}"
    # stderr is captured as well as stdout (2>&1).
    - pod5_version="$(cmake -P ci/get_tag_version.cmake 2>&1)"
    - tag_version="${CI_COMMIT_TAG/#v/}"
    - if [[ "${pod5_version}" != "${tag_version}" ]]; then
        echo "Tag is for release ${tag_version}, but POD5 version is $pod5_version";
        exit 1;
      fi

# Fails unless python/pod5/pyproject.toml pins `lib_pod5 == <X.Y.Z>`, where X.Y.Z is the leading
# three-part version taken from the _version.py artifact of prepare_version.
api_lib_version_check:
  stage: .pre
  needs:
    - "prepare_version"
  image: ${CI_REGISTRY}/minknow/images/build-x86_64-gcc13:latest
  script:
    - cat _version.py
    # Drop any "+local" suffix, then keep only the leading X.Y.Z part of the version.
    - NO_DEV_VERSION=$(grep "__version__" _version.py | awk '{print $5}' | tr -d "'" | cut -d'+' -f1 | sed 's/\([0-9]\+\.[0-9]\+\.[0-9]\+\).*$/\1/')
    - echo $NO_DEV_VERSION
    - cat python/pod5/pyproject.toml
    - echo "If this jobs fails then we have forgotten to match the api and lib version in the api python/pod5/pyproject.toml"
    # grep exits non-zero when the pin is missing, which fails the job.
    - grep "lib_pod5\s*==\s*$NO_DEV_VERSION" python/pod5/pyproject.toml


# Runs every pre-commit hook over the whole repository. The hook environments are cached in
# PRE_COMMIT_HOME; when the log shows one of two known bad-cache errors the cache is deleted and
# the hooks are run once more, otherwise a failure fails the job.
pre-commit checks:
  stage: .pre
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:3.10
  tags:
    - linux_x86
    - docker
  variables:
    PRE_COMMIT_HOME: ${CI_PROJECT_DIR}/.cache/pre-commit
  cache:
    paths:
      - ${PRE_COMMIT_HOME}
  script:
    - pip install pre-commit
    # The entries below form one shell if/else statement spread over several script lines.
    - if ! pre-commit run --all-files; then
    -   cat "${PRE_COMMIT_HOME}/pre-commit.log"
    - >-
      if grep -F -q \
        -e "InvalidManifestError" \
        -e "error: [Errno 17] File exists: 'build/temp.linux-x86_64-cpython-" \
        "${PRE_COMMIT_HOME}/pre-commit.log"; then
    -     echo "Bad cache state detected, deleting cache and re-running"
    -     rm -rf "${PRE_COMMIT_HOME}/"
    -     pre-commit run --all-files
    -   else
    -     exit 1
    -   fi
    - fi
  after_script:
    # Always try to show the log; a missing log must not fail the job.
    - cat "${PRE_COMMIT_HOME}/pre-commit.log" || true


# ======================================
#
#     Build Lib Standalone
#
# ======================================


# Builds and tests the library on a plain Ubuntu 22.04 image against distribution packages
# (Apache Arrow from the Arrow apt repository), with tests and examples enabled and without the
# Python wheel.
build-standalone-ubu22:
  stage: build
  image: external-docker.artifactory.oxfordnanolabs.local/ubuntu:22.04
  needs:
    - "prepare_version"
  script:
    # Keep apt from prompting during package installation.
    - export DEBIAN_FRONTEND=noninteractive
    - apt-get update
    - apt-get install -y -V ca-certificates lsb-release wget
    # Register the Apache Arrow apt source matching this distribution and release codename.
    - wget https://apache.jfrog.io/artifactory/arrow/$(lsb_release --id --short | tr 'A-Z' 'a-z')/apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
    - apt-get install -y -V ./apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
    - apt-get update
    # Arrow is pinned to an exact package version; libzstd-dev was previously listed twice.
    - apt-get install -y cmake build-essential libzstd-dev libflatbuffers-dev libarrow-dev=18.0.0-1
    - mkdir -p build
    - cd build
    - cmake
      -D POD5_DISABLE_TESTS=OFF
      -D POD5_BUILD_EXAMPLES=ON
      -D BUILD_PYTHON_WHEEL=OFF
      ..
    - cmake --build . --parallel
    - ctest -C Release -VV


# ======================================
#
#     Build helpers
#
# ======================================


# Shared script, pulled into job scripts with `!reference`. It configures, builds, tests and
# installs pod5 twice — first as a shared library without the Python wheel, then as a static
# library with the wheel — and finally packages the results.
# Reads: conan_exe, CONAN_PROFILE, EXTRA_INSTALL_ARGS, CMAKE_ARGS, PYTHON_VERSION, OUTPUT_SKU and
# AUDITWHEEL_PLATFORM.
# (A stray `- |` entry, which produced an empty first command, has been removed.)
.conan-build-and-test:
  - export TOOLCHAIN_FILE=build/generators/conan_toolchain.cmake
  # NOTE(review): pod5_version is not referenced again in this script and is not exported —
  # confirm whether it is still needed.
  - pod5_version="$(cmake -P ci/get_tag_version.cmake 2>&1)"
  - mkdir -p build
  - cd build
  - ${conan_exe} install --profile ${CONAN_PROFILE} ${EXTRA_INSTALL_ARGS} ..
  # Pass 1: shared library, no Python wheel.
  - cmake ${CMAKE_ARGS}
    -D BUILD_SHARED_LIB=ON
    -D CMAKE_BUILD_TYPE=Release
    -D POD5_DISABLE_TESTS=OFF
    -D POD5_BUILD_EXAMPLES=ON
    -D BUILD_PYTHON_WHEEL=OFF
    -D CMAKE_TOOLCHAIN_FILE=${TOOLCHAIN_FILE}
    ..
  - cmake --build . --config Release --parallel
  - ctest -C Release -VV
  - ../ci/install.sh
  # Pass 2: static library plus the Python wheel for ${PYTHON_VERSION}.
  - cmake ${CMAKE_ARGS}
    -D BUILD_SHARED_LIB=OFF
    -D CMAKE_BUILD_TYPE=Release
    -D POD5_DISABLE_TESTS=OFF
    -D POD5_BUILD_EXAMPLES=ON
    -D BUILD_PYTHON_WHEEL=ON
    -D PYTHON_VERSION=${PYTHON_VERSION}
    -D CMAKE_TOOLCHAIN_FILE=${TOOLCHAIN_FILE}
    ..
  - cmake --build . --config Release --parallel
  - ctest -C Release -VV
  - ../ci/install.sh STATIC_BUILD
  - ../ci/package.sh ${OUTPUT_SKU} ${AUDITWHEEL_PLATFORM}


# ======================================
#
#     Build Lib Linux
#
# ======================================


# Hidden template for the Linux library builds. It installs conan (1.x), auditwheel, build and the
# pinned cmake with the image's CPython 3.10, then runs the shared conan build-and-test script.
# Extending jobs supply the image, CONAN_PROFILE, OUTPUT_SKU and AUDITWHEEL_PLATFORM.
.build-linux:
  stage: build
  needs:
    - "prepare_version"
  variables:
    # Extra options passed to `conan install`.
    EXTRA_INSTALL_ARGS: "-o arrow:with_boost=False -o arrow:with_thrift=False -o arrow:parquet=False"
  before_script:
    - /opt/python/cp310-cp310/bin/pip install -U pip 'conan<2' auditwheel build "cmake==${CMAKE_VERSION}"
    # Link the installed entry points into /usr/bin.
    - ln -n /opt/python/cp310-cp310/bin/auditwheel /usr/bin/auditwheel
    - ln -n /opt/python/cp310-cp310/bin/conan /usr/bin/conan
    - conan config install --verify-ssl=no ${CONAN_CONFIG_URL}
    # The shared script invokes conan through ${conan_exe}.
    - conan_exe=$(which conan)
  script:
    - !reference [".conan-build-and-test"]
  artifacts:
    name: "${CI_JOB_NAME}-artifacts"
    paths:
      - "lib_pod5*.tar.gz"
      - "lib_pod5*.whl"

# x86_64 Linux library and wheel build in the manylinux2014 image, once per matrix Python version.
linux-x64-gcc9-release-build:
  extends:
    - .build-linux
    - .parallel-py-versions
  image: external-quay.artifactory.oxfordnanolabs.local/pypa/manylinux2014_x86_64
  tags:
    - linux
  variables:
    AUDITWHEEL_PLATFORM: manylinux2014_x86_64
    OUTPUT_SKU: "linux-x64"
    CONAN_PROFILE: "linux-x86_64-gcc9.jinja"
    CONAN_PROFILE_CPPSTD: 17

# aarch64 Linux library and wheel build in the manylinux2014 image, once per matrix Python version.
linux-aarch64-gcc9-release-build:
  extends:
    - .build-linux
    - .parallel-py-versions
  image: external-quay.artifactory.oxfordnanolabs.local/pypa/manylinux2014_aarch64
  tags:
    - linux_aarch64
    - high-cpu
  variables:
    AUDITWHEEL_PLATFORM: manylinux2014_aarch64
    OUTPUT_SKU: "linux-arm64"
    CONAN_PROFILE: "linux-aarch64-gcc9.jinja"
    CONAN_PROFILE_CPPSTD: 17


# ======================================
#
#     Build Lib OSX
#
# ======================================


# Hidden template for the macOS library builds. It uses two virtualenvs: `.venv_conan` holds
# conan and cmake, `.venv` holds the Python version being built for. conan_exe is captured while
# `.venv_conan` is active, so conan stays reachable after `.venv` is activated.
.build-osx-common:
  stage: build
  needs:
    - "prepare_version"
  variables:
    # Extra options passed to `conan install`.
    EXTRA_INSTALL_ARGS: "-o arrow:with_boost=False -o arrow:with_thrift=False -o arrow:parquet=False"
  before_script:
    - uv venv .venv_conan --python ${CONAN_VENV_PYTHON} --seed
    - source .venv_conan/bin/activate
    # Note that cmake 3.31+ does not work properly on macOS 14 (and earlier).
    # Pinning to 3.30 avoids SSL issues when connecting to internal servers, which is why
    # ${CMAKE_VERSION} is not used here.
    - uv pip install -U pip 'conan<2' 'cmake==3.30.9'
    - conan config install --verify-ssl=no "${CONAN_CONFIG_URL}"
    - conan_exe=$(which conan)
    - uv python install ${PYTHON_VERSION}
    - uv venv --python "python${PYTHON_VERSION}" .venv --seed
    - source .venv/bin/activate
    # Record which interpreter is in use in the job log.
    - which python
    - python --version
  script:
    # Print the platform tag that Python reports, for the job log.
    - python3 -c "import sysconfig; print(sysconfig.get_platform())"
    - !reference [".conan-build-and-test"]
  artifacts:
    name: "${CI_JOB_NAME}-artifacts"
    paths:
      - "lib_pod5*.tar.gz"
      - "lib_pod5*.whl"

# arm64 macOS library and wheel build targeting macOS 14.0, once per matrix Python version.
osx-arm64-clang15-release-build:
  extends:
    - .build-osx-common
    - .parallel-py-versions
  tags:
    - osx_arm64
    - xcode-15.3
    - conan
  variables:
    # Conan toolchain selection.
    CONAN_PROFILE: "macos-aarch64-appleclang-15.0.jinja"
    CONAN_PROFILE_CPPSTD: 20
    # Target platform.
    CMAKE_ARGS: "-DCMAKE_OSX_ARCHITECTURES=arm64"
    MACOSX_DEPLOYMENT_TARGET: "14.0"
    FORCE_PYTHON_PLATFORM: macosx_14_0_arm64
    OUTPUT_SKU: "osx-14.0-arm64"


# ======================================
#
#     Build Lib Windows
#
# ======================================


# Hidden template for the Windows library builds. It uses two virtualenvs: `.venv_conan` holds
# conan and cmake, `.venv` holds the Python version being built for. conan_exe is captured while
# `.venv_conan` is active, so conan stays reachable after `.venv` is activated.
# A failed job is retried once.
.build-win-common:
  stage: build
  needs:
    - "prepare_version"
  retry: 1
  variables:
    # We need to override arrow's boost 1.85.0 requirement to match the version we use internally.
    EXTRA_INSTALL_ARGS: "-o arrow:with_thrift=False -o arrow:parquet=False --require=boost/1.86.0@ -o boost:without_locale=True"
  before_script:
    - uv venv .venv_conan --python ${CONAN_VENV_PYTHON} --seed
    - source .venv_conan/Scripts/activate
    - uv pip install 'conan<2' "cmake==${CMAKE_VERSION}"
    - conan config install --verify-ssl=no "${CONAN_CONFIG_URL}"
    - conan_exe=$(which conan)
    - uv python install ${PYTHON_VERSION}
    - uv venv --python "python${PYTHON_VERSION}" .venv --seed
    - source .venv/Scripts/activate
  script:
    - uv pip install build
    - !reference [".conan-build-and-test"]
  after_script:
    # HACK: for some reason, pod5_unit_tests.exe is sticking around; deleting it works, but it
    # doesn't go away immediately (as though something had it open with FILE_SHARE_DELETE, although
    # the Handle utility from SysInternals couldn't find anything).
    # This also appears to be happening for the fuzz targets, so remove and wait for every exe.
    - rm -v build/Release/bin/*.exe
    # The two `date` calls bracket the wait so the job log shows how long it took.
    - date
    # Poll once per second until `ls` no longer finds any .exe file.
    - while true; do
    -   ls build/Release/bin/*.exe || break
    -   sleep 1
    - done
    - date

# x64 Windows library and wheel build with Visual Studio 2019, once per matrix Python version.
win-x64-msvc2019-release-build:
  extends:
    - .build-win-common
    - .parallel-py-versions
  tags:
    - windows
    - VS2019
    - conan
  variables:
    # Conan toolchain selection.
    CONAN_PROFILE: "windows-x86_64-vs2019.jinja"
    CONAN_PROFILE_CPPSTD: 17
    # CMake generator and target architecture.
    CMAKE_GENERATOR: "Visual Studio 16 2019"
    CMAKE_ARGS: "-A x64"
    OUTPUT_SKU: "win-x64"
  artifacts:
    name: "${CI_JOB_NAME}-artifacts"
    paths:
      - "lib_pod5*.tar.gz"
      - "lib_pod5*.whl"

# ======================================
#
#     Build Python API
#
# ======================================


# Builds the pure-Python `pod5` sdist and wheel from python/pod5, after rewriting its lib_pod5
# dependency to the exact version computed by prepare_version.
build-python-api:
  stage: build
  needs:
    - "prepare_version"
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:3.10
  tags:
    - linux
  script:
    # Same tag clean-up as in prepare_version: delete local tags whose names contain a, b, r, c
    # or dev.
    - git tag -d $(git tag -l "*a*")
    - git tag -d $(git tag -l "*b*")
    - git tag -d $(git tag -l "*r*")
    - git tag -d $(git tag -l "*c*")
    - git tag -d $(git tag -l "*dev*")
    # On a tag pipeline, make sure a tag without the leading "v" exists locally.
    - if [[ ${CI_COMMIT_TAG/#v/} && -z $( git tag -l "${CI_COMMIT_TAG/#v/}" ) ]]; then git tag ${CI_COMMIT_TAG/#v/}; fi
    - cat _version.py
    # Version from _version.py with any "+local" suffix cut off.
    - VERSION=$(grep "__version__" _version.py | awk '{print $5}' | tr -d "'" | cut -d'+' -f1)
    - echo $VERSION
    - cd python/pod5/
    # update the lib_pod5 dependency in pod5/pyproject.toml to match
    # (every line mentioning lib_pod5 is replaced by the exact pin).
    - sed -i "s/.*lib_pod5.*/\ \ \ \ \'lib_pod5 == ${VERSION}\',/" pyproject.toml
    - cat pyproject.toml
    - pip install -U pip build
    # Write the build outputs to the repository root, where the artifact globs look for them.
    - python -m build --outdir ../../
    - cd ../..
    - ls *.whl *.tar.gz
  artifacts:
    name: "${CI_JOB_NAME}-artifacts"
    paths:
      - "pod5*.whl"
      - "pod5*.tar.gz"


# ======================================
#
#     Test Tools
#
# ======================================

# End-to-end check of the command line tools on x86_64 Linux, once per matrix Python version:
# convert the test fast5 data to pod5, compare the result with each reference pod5 file
# (v0 to v4), then convert to fast5 and back to pod5 and compare again.
tools-linux-x64:
  extends:
    - .parallel-py-versions
  stage: test
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:${PYTHON_VERSION}
  tags:
    - linux
  before_script:
    - python${PYTHON_VERSION} -m venv .venv/
    - source .venv/bin/activate
  needs:
    - linux-x64-gcc9-release-build
    - build-python-api
  script:
    # ${PYTHON_VERSION/./} removes the dot ("3.10" becomes "310") to select the matching cpXY wheel.
    - pip install ./lib_pod5*cp${PYTHON_VERSION/./}*.whl pod5-*.whl
    - pod5 convert fast5 ./test_data/ --output ./output_files --one-to-one ./test_data
    # The freshly converted file is compared with every reference file in test_data.
    - python${PYTHON_VERSION} python/pod5/test_utils/check_pod5_files_equal.py ./output_files/multi_fast5_zip.pod5 ./test_data/multi_fast5_zip_v4.pod5
    - python${PYTHON_VERSION} python/pod5/test_utils/check_pod5_files_equal.py ./output_files/multi_fast5_zip.pod5 ./test_data/multi_fast5_zip_v3.pod5
    - python${PYTHON_VERSION} python/pod5/test_utils/check_pod5_files_equal.py ./output_files/multi_fast5_zip.pod5 ./test_data/multi_fast5_zip_v2.pod5
    - python${PYTHON_VERSION} python/pod5/test_utils/check_pod5_files_equal.py ./output_files/multi_fast5_zip.pod5 ./test_data/multi_fast5_zip_v1.pod5
    - python${PYTHON_VERSION} python/pod5/test_utils/check_pod5_files_equal.py ./output_files/multi_fast5_zip.pod5 ./test_data/multi_fast5_zip_v0.pod5
    # Round trip: pod5 -> fast5 -> pod5, then compare with the first conversion.
    - pod5 convert to_fast5 ./output_files/ --output ./output_files
    - pod5 convert fast5 ./output_files/*.fast5 --output ./output_files_2 --one-to-one ./output_files/
    - python${PYTHON_VERSION} python/pod5/test_utils/check_pod5_files_equal.py ./output_files/multi_fast5_zip.pod5 ./output_files_2/*.pod5


# ======================================
#
#     Pytest
#
# ======================================


# Shared template for the pytest jobs: creates and activates a virtualenv,
# installs the built wheels and runs the test suite twice.
.pytest:
  stage: test
  before_script:
    - python${PYTHON_VERSION} -m venv .venv/
    # The glob matches whichever sub-directory of the venv holds the activate
    # script, so this line does not hard-code "bin".
    - source .venv/*/activate
    - python --version
    - python -m pip install --upgrade pip
  script:
    # ${PYTHON_VERSION/./} removes the first "." (e.g. 3.10 -> 310) to match the
    # cpXY tag in the lib_pod5 wheel file name.
    - pip install ./lib_pod5*cp${PYTHON_VERSION/./}*.whl pod5-*.whl
    - pip install pytest pytest-cov pytest-mock psutil
    # First run with default settings, then again with POD5_DISABLE_MMAP_OPEN=1.
    - pytest
    - POD5_DISABLE_MMAP_OPEN=1 pytest

# Variant of .pytest that uses uv to install the requested Python version and
# create the virtualenv; only before_script is replaced, the script section is
# inherited from .pytest.
.pytest-with-uv:
  extends:
    - .pytest
  before_script:
    - uv python install ${PYTHON_VERSION}
    - uv venv --python "python${PYTHON_VERSION}" .venv --seed
    - source .venv/*/activate

# Pytest on Linux x86_64, using the wheels from the gcc9 release build.
pytest-linux-x64:
  extends: [".pytest", ".parallel-py-versions"]
  needs: ["linux-x64-gcc9-release-build", "build-python-api"]
  tags: ["linux"]
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:${PYTHON_VERSION}

# Pytest on Linux aarch64, using the wheels from the aarch64 gcc9 release build.
pytest-linux-aarch64:
  extends: [".pytest", ".parallel-py-versions"]
  needs: ["linux-aarch64-gcc9-release-build", "build-python-api"]
  tags: ["linux_aarch64", "high-cpu"]
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:${PYTHON_VERSION}

# Pytest on macOS arm64; the virtualenv is provisioned with uv.
pytest-osx-arm64:
  extends: [".pytest-with-uv", ".parallel-py-versions"]
  needs: ["osx-arm64-clang15-release-build", "build-python-api"]
  tags: ["osx_arm64"]

# Pytest on Windows x64; the virtualenv is provisioned with uv and the job is
# retried once on failure.
pytest-win-x64:
  extends: [".pytest-with-uv", ".parallel-py-versions"]
  needs: ["win-x64-msvc2019-release-build", "build-python-api"]
  tags: ["windows"]
  retry: 1


# ======================================
#
#     Conda Testing
#
# ======================================


# Runs the .pytest script inside a conda environment instead of a venv.
# The before_script defined here replaces the one inherited from .pytest.
conda_pytest:
  extends:
    - .pytest
    - .parallel-py-versions
  image: ${CI_REGISTRY}/minknow/pod5-file-format/conda:latest
  tags:
    - linux
  needs:
    - linux-x64-gcc9-release-build
    - build-python-api
  before_script:
    # Generate the environment definition on the fly so that the Python
    # version follows ${PYTHON_VERSION}.
    - |
      cat > environment.yml << EOF
      name: pod5_conda_test
      channels:
        - conda-forge
        - bioconda
      dependencies:
        - python=${PYTHON_VERSION}
        - cmake
        - pyarrow
        - pip
      EOF
    - cat environment.yml
    - mamba --version
    - mamba env create -f environment.yml
    - conda env list
    # This is a work around for conda init in gitlab
    - eval "$(conda shell.bash hook)"
    - conda activate pod5_conda_test


# ======================================
#
#     Benchmarks
#
# ======================================


# Shared template for the benchmark jobs. Concrete jobs must set
# LIB_WHEEL_GLOB to the glob that selects the lib_pod5 wheel to install.
.benchmark:
  stage: test
  before_script:
    - python3 -m venv .venv/
    - source .venv/bin/activate
  script:
    - pip install ./${LIB_WHEEL_GLOB} pod5-*.whl setuptools
    - pip install -r ./benchmarks/image/requirements-benchmarks.txt
    - ./benchmarks/image/install_slow5.sh
    # Put the slow5tools-v1.3.0 directory on PATH for the benchmark run.
    # NOTE(review): presumably install_slow5.sh creates this directory in the
    # working directory - confirm.
    - export PATH="$(pwd)/slow5tools-v1.3.0/:$PATH"
    - ./benchmarks/run_benchmarks.py ./test_data/ ./benchmark-outputs

# Benchmarks on Linux x86_64 with the CPython 3.14 lib_pod5 wheel.
benchmark-linux-x64:
  extends: .benchmark
  variables:
    LIB_WHEEL_GLOB: "lib_pod5*cp314*.whl"
  needs: ["linux-x64-gcc9-release-build", "build-python-api"]
  tags: ["linux"]
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:3.14

# Benchmarks on Linux aarch64 with the CPython 3.14 lib_pod5 wheel.
benchmark-linux-aarch64:
  extends: .benchmark
  variables:
    LIB_WHEEL_GLOB: "lib_pod5*cp314*.whl"
  needs: ["linux-aarch64-gcc9-release-build", "build-python-api"]
  tags: ["linux_aarch64", "high-cpu"]
  image: ${CI_REGISTRY}/traque/ont-docker-base/ont-base-python:3.14


# ======================================
#
#     Fuzz tests and coverage reports
#
# ======================================

# Shared template for the gcc11 Linux x86_64 builds (fuzzing and coverage).
# Installs Conan 1.x and CMake with pip, resolves dependencies with
# `conan install`, then configures and builds the project in ./build.
# Jobs extending this template can set CMAKE_EXTRA_ARGS to pass additional
# options to the CMake configure step, and may override CMAKE_BUILD_TYPE.
.generic-linux-x64-gcc11-build:
  stage: build
  image: external-docker.artifactory.oxfordnanolabs.local/ubuntu:jammy
  tags:
    - linux
  variables:
    CONAN_PROFILE: "linux-x86_64-gcc11.jinja"
    # Quoted so the value is a string, matching CONAN_PROFILE_CPPSTD elsewhere
    # in this file.
    CONAN_PROFILE_CPPSTD: "20"
    CMAKE_BUILD_TYPE: Release
  needs:
    - "prepare_version"
  script:
    # Install requirements.
    - apt-get update
    - apt-get install -y pip
    - pip install -U pip 'conan<2' auditwheel build "cmake==${CMAKE_VERSION}"
    - conan config install --verify-ssl=no ${CONAN_CONFIG_URL}
    # Setup build.
    - pod5_version="$(cmake -P ci/get_tag_version.cmake 2>&1)"
    - mkdir -p build
    - pushd build
        # Tell conan that it's OK to use libstdc++ settings.
    -   conan install
          --profile ${CONAN_PROFILE}
          -s compiler.libcxx=libstdc++11
          -s compiler.cppstd=${CONAN_PROFILE_CPPSTD}
          -s build_type=${CMAKE_BUILD_TYPE}
          -o arrow:with_boost=False
          -o arrow:with_thrift=False
          -o arrow:parquet=False
          ..
    -   cmake
          -D CMAKE_TOOLCHAIN_FILE=build/generators/conan_toolchain.cmake
          -D CMAKE_BUILD_TYPE=${CMAKE_BUILD_TYPE}
          -D BUILD_PYTHON_WHEEL=OFF
          ${CMAKE_EXTRA_ARGS}
          ..
        # Do the build
    -   cmake --build . --config ${CMAKE_BUILD_TYPE} --parallel
    - popd

# Builds the fuzzers with clang and runs one fuzz test per parallel job
# (FUZZER_TEST = "compress" or "file"). Failures do not fail the pipeline
# (allow_failure), and ./fuzz is always kept as an artifact.
linux-x64-gcc11-fuzz:
  extends: .generic-linux-x64-gcc11-build
  allow_failure: true
  variables:
    CC: clang
    CXX: clang++
    CMAKE_EXTRA_ARGS: "-D ENABLE_FUZZERS=ON -D FUZZER_RUN_TIME=600"
  script:
    # We need clang for libFuzzer.
    - apt-get update
    - apt-get install -y clang
    # Do the build.
    - !reference [".generic-linux-x64-gcc11-build", "script"]
    # Remove the zipped corpora now that we've extracted it, since we
    # don't need it artifacted.
    - rm fuzz/*.zip
    # Run the tests.
    - ctest -C Release --test-dir build -VV -R ${FUZZER_TEST}
  parallel:
    matrix:
      - FUZZER_TEST:
        - "compress"
        - "file"
  artifacts:
    # Artifact everything in /fuzz so that we can get to any new/failing corpora.
    when: always
    paths:
      - ./fuzz

# Debug build with tests and coverage instrumentation enabled, followed by
# generation of Cobertura XML and HTML coverage reports.
linux-x64-gcc11-coverage:
  extends: .generic-linux-x64-gcc11-build
  variables:
    CMAKE_BUILD_TYPE: "Debug"
    CMAKE_EXTRA_ARGS: "-D POD5_DISABLE_TESTS=OFF -D ENABLE_COVERAGE_REPORT=ON"
  script:
    # We need a venv.
    - apt-get update
    - apt-get install -y python3-venv
    # Do the build.
    - !reference [".generic-linux-x64-gcc11-build", "script"]
    # Run the coverage report.
    - ./ci/generate_coverage_report.sh build
  # Extracts the percentage from the log line that starts with "TOTAL".
  coverage: '/^TOTAL\s+\d+\s+\d+\s+(\d+(?:\.\d+)?\%)$/'
  artifacts:
    reports:
      coverage_report:
        coverage_format: cobertura
        path: coverage-report-*.xml
    paths:
      # Artifact the human readable ones too.
      - coverage-report-*.html


# ======================================
#
#     Conan
#
# ======================================

# Script fragment (pulled in with !reference): on any kernel whose name does
# not match "Linux", create a Python 3.13 virtualenv in .venv and activate it.
# The entries are consecutive lines of one shell `if` statement.
.setup-venv:
  - KERNEL=$(uname -s)
  - if [[ ! ${KERNEL} =~ "Linux" ]]; then
      # Must use an explicit version here otherwise we get the windows store one.
      # Can be any version since it's only for installing conan.
  -   python3.13 -m venv .venv
  -   source .venv/*/activate
  - fi

# Script fragment (pulled in with !reference): when `uname -s` starts with
# MINGW, CYGWIN or MSYS, remove every tracked file and check the tree out
# again from HEAD.
.reset-line-endings:
  # This is needed to enforce LF line-endings in the pybind submodule
  # otherwise conan generates different revisions for windows and unix
  - re='^(MINGW|CYGWIN|MSYS).*'
  - if [[ $(uname -s) =~ $re ]]; then
  -   git rm -rf :/
  -   git checkout HEAD -- :/
  - fi

# Script fragment shared by the Conan 1.x jobs: normalise line endings, set up
# the venv where required, install Conan 1.x and store the output of
# ci/get_tag_version.cmake in VERSIONS.
.conan-setup-common:
  - !reference [".reset-line-endings"]
  - !reference [".setup-venv"]
  - pip install 'conan<2'
  - conan --version
  # cmake -P output is captured with stderr redirected into stdout.
  - VERSIONS="$(cmake -P ci/get_tag_version.cmake 2>&1)"

# Template for the Conan 1.x package build jobs: runs the common setup, then
# clears the local Conan cache and installs the shared Conan configuration.
.conan-build-common:
  stage: build-conan
  dependencies:
    - "prepare_version"
  before_script:
    - !reference [".conan-setup-common"]
    # Remove all packages from the local cache without prompting.
    - conan remove "*" -f
    - conan config install --verify-ssl=no "${CONAN_CONFIG_URL}"

# Template shared by the Conan 2 build and upload jobs: installs the latest
# Conan, clears the local cache and installs the Conan 2 configuration.
.conan2-common:
  before_script:
    - !reference [".reset-line-endings"]
    - !reference [".setup-venv"]
    - pip install --upgrade conan
    - conan --version
    # Remove all packages from the local cache without prompting.
    - conan remove "*" --confirm
    - conan config install --verify-ssl=no "${CONAN2_CONFIG_URL}"

# Template for the Conan 2 package builds. Runs `conan create` for both Debug
# and Release (parallel matrix) and saves the resulting cache contents to
# conan-${CI_JOB_ID}.tgz, which is kept as an artifact.
# PROFILE_BASE is presumably provided by the .profile-*-conan2 template the
# concrete job also extends (defined outside this section).
.conan2-build:
  extends: .conan2-common
  stage: build-conan
  dependencies:
    - "prepare_version"
  script:
    # Keep only the first three dot-separated components of the version.
    - version=$(cmake -P ci/get_tag_version.cmake 2>&1 | cut -d. -f1-3)
      # set up the correct ref
    - opts=("--version=${version}" --user=nanopore --channel=stable)
      # fail if we can't find dependencies
    - opts+=("--build=pod5_file_format/*")
      # select the build profile
    - opts+=(-pr:a "${PROFILE_BASE}")
      # use the arrow packages we have built
    - opts+=('-o:a=arrow/*:with_thrift=False' '-o:a=arrow/*:parquet=False' '-o:a=arrow/*:with_zstd=True' '-o:a=arrow/*:with_boost=False')
    - echo "Running conan create . ${opts[@]}"
    - conan create . "${opts[@]}"
    - conan cache save "*/*:*" --file=conan-${CI_JOB_ID}.tgz
  variables:
    # use an arrow package that doesn't use Boost, even on Windows
    CONAN_MANUAL_OVERRIDES: "arrow/*:arrow/18.0.0@nanopore/noboost"
    CONAN_PROFILE_CPPSTD: "20"
  artifacts:
    paths:
      - 'conan-*.tgz'
  parallel:
    matrix:
      - CONAN_PROFILE_BUILD_TYPE: ["Debug", "Release"]

# Template for the Conan 2 upload jobs: restores every conan-*.tgz cache
# archive found in the working directory, authenticates against the
# ONT-Conan-V2 remote and runs `conan upload`.
# NOTE(review): the upload is invoked with --dry-run and the tags-only
# restriction below is commented out, so nothing is actually published and the
# job is not limited to tag pipelines - confirm this is intentional.
.conan2-upload:
  extends: .conan2-common
  stage: deploy
  #only: ["tags"]
  script:
    - for f in conan-*.tgz; do conan cache restore "$f"; done
    - conan remote auth ONT-Conan-V2 --force
    - conan upload "*:*" --check --confirm --remote=ONT-Conan-V2 --dry-run

# Template for the Conan 1.x upload jobs. Only runs for tag pipelines; the
# upload logic itself comes from .upload-package.
.conan-upload:
  extends: .upload-package # from informatics/conan-config
  stage: deploy
  only: ["tags"]
  before_script:
    # cmake is installed first because the common setup runs a cmake -P script.
    - pip install "cmake==${CMAKE_VERSION}"
    - !reference [".conan-setup-common"]
  variables:
      EXPECTED_PACKAGE_COUNT: "4" # Expect shared and static packages

# Conan: build and upload packages:
# Windows x86_64 / VS2019: Conan 1 package build and upload.
build-conan:windows-x86_64-vs2019:
  extends:
    - .profile-windows-x86_64-vs2019
    - .build-package-win
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"
    - "win-x64-msvc2019-release-build"

upload-conan:windows-x86_64-vs2019:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:windows-x86_64-vs2019"

# Windows x86_64 / VS2019: Conan 2 package build and upload.
build-conan2:windows-x86_64-vs2019:
  extends:
    - .conan2-build
    - .profile-windows-x86_64-vs2019-conan2
  needs:
    - "prepare_version"
    - "win-x64-msvc2019-release-build"

upload-conan2:windows-x86_64-vs2019:
  extends:
    - .conan2-upload
    - .profile-windows-x86_64-vs2019-conan2
  dependencies:
    - "prepare_version"
    - "build-conan2:windows-x86_64-vs2019"

# macOS aarch64 / AppleClang 15.0: Conan 1 package build and upload.
build-conan:macos-aarch64-appleclang-15.0:
  extends:
    - .profile-macos-aarch64-appleclang-15.0
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"
    - "osx-arm64-clang15-release-build"

upload-conan:macos-aarch64-appleclang-15.0:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:macos-aarch64-appleclang-15.0"

# macOS aarch64 / AppleClang 16.0: Conan 1 package build and upload.
build-conan:macos-aarch64-appleclang-16.0:
  extends:
    - .profile-macos-aarch64-appleclang-16.0
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:macos-aarch64-appleclang-16.0:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:macos-aarch64-appleclang-16.0"

# macOS aarch64 / AppleClang 15.0: Conan 2 package build and upload.
build-conan2:macos-aarch64-appleclang-15.0:
  extends:
    - .profile-macos-aarch64-appleclang-15.0-conan2
    - .conan2-build
  needs:
    - "prepare_version"
    - "osx-arm64-clang15-release-build"

upload-conan2:macos-aarch64-appleclang-15.0:
  extends:
    - .profile-macos-aarch64-appleclang-15.0-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:macos-aarch64-appleclang-15.0"

# macOS aarch64 / AppleClang 16.0: Conan 2 package build and upload.
build-conan2:macos-aarch64-appleclang-16.0:
  extends:
    - .profile-macos-aarch64-appleclang-16.0-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:macos-aarch64-appleclang-16.0:
  extends:
    - .profile-macos-aarch64-appleclang-16.0-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:macos-aarch64-appleclang-16.0"

# Linux x86_64 / gcc11: Conan 1 package build and upload.
build-conan:linux-x86_64-gcc11:
  extends:
    - .profile-linux-x86_64-gcc11
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc11:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc11"

# Linux x86_64 / gcc11: Conan 2 package build and upload.
build-conan2:linux-x86_64-gcc11:
  extends:
    - .profile-linux-x86_64-gcc11-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:linux-x86_64-gcc11:
  extends:
    - .profile-linux-x86_64-gcc11-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:linux-x86_64-gcc11"

# Linux x86_64 / gcc11 sanitizer profiles (asan, usan, tsan): Conan 2.
build-conan2:linux-x86_64-gcc11-asan-static:
  extends:
    - .profile-linux-x86_64-gcc11-asan-static-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:linux-x86_64-gcc11-asan-static:
  extends:
    - .profile-linux-x86_64-gcc11-asan-static-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:linux-x86_64-gcc11-asan-static"

build-conan2:linux-x86_64-gcc11-usan-static:
  extends:
    - .profile-linux-x86_64-gcc11-usan-static-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:linux-x86_64-gcc11-usan-static:
  extends:
    - .profile-linux-x86_64-gcc11-usan-static-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:linux-x86_64-gcc11-usan-static"

build-conan2:linux-x86_64-gcc11-tsan-static:
  extends:
    - .profile-linux-x86_64-gcc11-tsan-static-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:linux-x86_64-gcc11-tsan-static:
  extends:
    - .profile-linux-x86_64-gcc11-tsan-static-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:linux-x86_64-gcc11-tsan-static"

# Linux x86_64 / gcc13: Conan 1 package build and upload.
build-conan:linux-x86_64-gcc13:
  extends:
    - .profile-linux-x86_64-gcc13
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc13:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc13"

# Linux x86_64 / gcc13: Conan 2 package build and upload.
build-conan2:linux-x86_64-gcc13:
  extends:
    - .profile-linux-x86_64-gcc13-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:linux-x86_64-gcc13:
  extends:
    - .profile-linux-x86_64-gcc13-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:linux-x86_64-gcc13"

# Linux x86_64 sanitizer profiles (asan, tsan, usan) for gcc11 and gcc13:
# Conan 1.
build-conan:linux-x86_64-gcc11-asan-static:
  extends:
    - .profile-linux-x86_64-gcc11-asan-static
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc11-asan-static:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc11-asan-static"

build-conan:linux-x86_64-gcc13-asan-static:
  extends:
    - .profile-linux-x86_64-gcc13-asan-static
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc13-asan-static:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc13-asan-static"

build-conan:linux-x86_64-gcc11-tsan-static:
  extends:
    - .profile-linux-x86_64-gcc11-tsan-static
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc11-tsan-static:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc11-tsan-static"

build-conan:linux-x86_64-gcc13-tsan-static:
  extends:
    - .profile-linux-x86_64-gcc13-tsan-static
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc13-tsan-static:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc13-tsan-static"

build-conan:linux-x86_64-gcc11-usan-static:
  extends:
    - .profile-linux-x86_64-gcc11-usan-static
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc11-usan-static:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc11-usan-static"

build-conan:linux-x86_64-gcc13-usan-static:
  extends:
    - .profile-linux-x86_64-gcc13-usan-static
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-x86_64-gcc13-usan-static:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-x86_64-gcc13-usan-static"

# Linux aarch64 / gcc11: Conan 1 package build and upload.
build-conan:linux-aarch64-gcc11:
  extends:
    - .profile-linux-aarch64-gcc11
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-aarch64-gcc11:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-aarch64-gcc11"

# Linux aarch64 / gcc11: Conan 2 package build and upload.
build-conan2:linux-aarch64-gcc11:
  extends:
    - .profile-linux-aarch64-gcc11-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:linux-aarch64-gcc11:
  extends:
    - .profile-linux-aarch64-gcc11-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:linux-aarch64-gcc11"

# Linux aarch64 / gcc13: Conan 1 package build and upload.
build-conan:linux-aarch64-gcc13:
  extends:
    - .profile-linux-aarch64-gcc13
    - .build-package
    - .conan-build-common
    - .build-shared-and-static
  needs:
    - "prepare_version"

upload-conan:linux-aarch64-gcc13:
  extends: .conan-upload
  dependencies:
    - "prepare_version"
    - "build-conan:linux-aarch64-gcc13"

# Linux aarch64 / gcc13: Conan 2 package build and upload.
build-conan2:linux-aarch64-gcc13:
  extends:
    - .profile-linux-aarch64-gcc13-conan2
    - .conan2-build
  needs:
    - "prepare_version"

upload-conan2:linux-aarch64-gcc13:
  extends:
    - .profile-linux-aarch64-gcc13-conan2
    - .conan2-upload
  dependencies:
    - "prepare_version"
    - "build-conan2:linux-aarch64-gcc13"

# ======================================
#
#     Archive
#
# ======================================


# Collects the artifacts of every release build plus the Python package into a
# single artifact bundle (all *.tar.gz and *.whl files in the job directory).
build-archive:
  stage: archive
  needs: ["linux-x64-gcc9-release-build", "linux-aarch64-gcc9-release-build", "osx-arm64-clang15-release-build", "win-x64-msvc2019-release-build", "build-python-api"]
  artifacts:
    name: "${CI_JOB_NAME}-artifacts"
    paths: ["./*.tar.gz", "./*.whl"]
  script:
    # List everything that was downloaded, for the job log.
    - find .


# ======================================
#
#     Deploy
#
# ======================================


# Manual, tags-only job: uploads every wheel and the pod5 sdist from the
# build-archive artifacts with twine, using the repository settings already
# present in the job environment.
internal_wheel_upload:
  stage: deploy
  when: manual
  only:
    - "tags"
  needs:
    - build-archive
  image: ${UPLOAD_PYTHON_IMAGE}
  script:
    - ls -lh .
    - pip install twine
    - twine upload *.whl pod5*.tar.gz

# Manual, tags-only job: uploads the lib_pod5 wheels and the pod5 wheel/sdist
# with twine using API tokens, after clearing the TWINE_REPOSITORY_URL and
# TWINE_CERT overrides from the environment.
external_wheel_upload:
  stage: deploy
  when: manual
  only:
    - "tags"
  needs:
    - build-archive
  image: ${UPLOAD_PYTHON_IMAGE}
  script:
    - ls -lh .
    - pip install twine
    # Drop the repository URL / certificate overrides so twine falls back to
    # its default upload target.
    - unset TWINE_REPOSITORY_URL
    - unset TWINE_CERT
    # lib_pod5 and pod5 are uploaded with separate tokens.
    - twine upload lib*.whl -u __token__ -p"${EXTERNAL_LIB_POD5_PYPI_KEY}"
    - twine upload pod5*.whl pod5*.tar.gz -u __token__ -p"${EXTERNAL_POD5_PYPI_KEY}"


# ======================================
#
#     MLHub Testing
#
# ======================================

# Manually-triggered job that POSTs a JSON request to ${MLHUB_TRIGGER_URL},
# identifying this pipeline's commit and the Python version to test.
# No repository checkout is performed (GIT_STRATEGY: none).
# PYTHON_VERSION is presumably supplied by .parallel-py-versions, which is
# defined outside this section.
mlhub:
  stage: deploy
  image: ${MLHUB_TRIGGER_IMAGE}
  needs: ["build-archive"]
  variables:
    GIT_STRATEGY: none
  script:
    # The payload is a single-quoted shell string that is closed and reopened
    # around each variable so the shell expands it. Every member inside a JSON
    # object must be comma-separated, including "source" and "python_ver".
    - |
      curl -i --header "Content-Type: application/json" \
      --request POST \
      --data '{
          "key": "'${MLHUB_TRIGGER_KEY}'",
          "job_name": "POD5-CI '${CI_COMMIT_REF_NAME}' - '"$CI_COMMIT_TITLE"' ",
          "script_parameters": {
                "mode":"artifact",
                "source":"'${CI_COMMIT_SHA}'",
                "python_ver":"'${PYTHON_VERSION}'"
              }
      }' \
      ${MLHUB_TRIGGER_URL}
  when: manual
  extends:
    - .parallel-py-versions


================================================
FILE: .gitmodules
================================================
# pybind11 is vendored as a git submodule under third_party/pybind11 and
# follows the upstream `stable` branch.
[submodule "third_party/pybind11"]
	path = third_party/pybind11
	url = https://github.com/pybind/pybind11.git
	branch = stable


================================================
FILE: .pre-commit-config.yaml
================================================
# See https://pre-commit.com for more information
# See https://pre-commit.com/hooks.html for more hooks
repos:
  # Generic file hygiene checks.
  - repo: https://github.com/pre-commit/pre-commit-hooks
    rev: 'v5.0.0'
    hooks:
      - id: trailing-whitespace
      - id: end-of-file-fixer
      - id: check-case-conflict
      - id: check-merge-conflict
      - id: check-added-large-files

  # Python formatting.
  - repo: https://github.com/psf/black
    rev: '25.1.0'
    hooks:
      - id: black

  # Spell checking (vendored third-party code is skipped).
  - repo: https://github.com/codespell-project/codespell
    rev: 'v2.4.1'
    hooks:
      - id: codespell
        exclude: 'third_party/'

  # Python linting (the Sphinx configuration is skipped).
  - repo: https://github.com/PyCQA/flake8
    rev: '7.2.0'
    hooks:
      - id: flake8
        exclude: 'docs/conf.py'

  # Shell script linting.
  - repo: https://github.com/shellcheck-py/shellcheck-py
    rev: 'v0.10.0.1'
    hooks:
      - id: shellcheck

  # C/C++ formatting (vendored third-party code is skipped).
  - repo: https://github.com/pre-commit/mirrors-clang-format
    rev: 'v20.1.4'
    hooks:
      - id: clang-format
        exclude: 'third_party/'

  # Static type checking, restricted to the pod5 Python sources.
  - repo: https://github.com/pre-commit/mirrors-mypy
    rev: 'v1.15.0'
    hooks:
      - id: mypy
        files: 'python/pod5/src/'
        args:
          - --check-untyped-defs
          - --ignore-missing-imports
        additional_dependencies:
          - types-Deprecated
          - types-setuptools
          - types-pytz

# NB: by default, pre-commit only installs the pre-commit hook ("commit" stage),
# but you can tell `pre-commit install` to install other hooks.
# This set of default stages ensures we don't slow down or break other git operations
# even if you install hooks for them.
default_stages: [pre-commit, pre-merge-commit, manual]

# vi:et:sw=2:sts=2:


================================================
FILE: .readthedocs.yaml
================================================
# Read the Docs configuration file
# See https://docs.readthedocs.io/en/stable/config-file/v2.html for details

# Required: version of the Read the Docs configuration schema
version: 2

# Build every additional output format
formats: all

# Build environment: OS image, Python version and extra job steps
build:
  os: ubuntu-20.04
  tools:
    python: "3.10"
  jobs:
    pre_build:
      # Check that pod5 imports and print its version before the docs build.
      - python -c "import pod5; print(pod5.__version__)"

# Build documentation in the docs/ directory with Sphinx
sphinx:
  configuration: docs/conf.py

# If using Sphinx, optionally build your docs in additional formats such as PDF
# formats:
#   - pdf

# Python requirements needed to build the docs
python:
  install:
    - requirements: docs/requirements.txt


================================================
FILE: CHANGELOG.md
================================================
<!-- markdownlint-disable MD024 -->

# Changelog

All notable changes, updates, and fixes to pod5 will be documented here

The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/)
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).

## [0.3.39]

### Fixed

- Fix python bindings build without Conan.

### Changed

- CI Stabilisation

## [0.3.38]

### Changed

- CI Stabilisation

## [0.3.37]

### Changed

- Use standard file IO to read POD5 header and footer metadata before memory mapping (if not disabled e.g. `POD5_DISABLE_MMAP_OPEN=1`). This should avoid SIGBUS errors caused by memory mapping file stubs (archive artefacts).
- Improve file_reader_writer unit-tests robustness
- Scale number of open input file handles during pod5 subset / filter by the system limits and number of output files.

### Fixed

- Fixed bug where invalid read ids could be passed into pod5 subset via summary table.
- Fixed bug where invalid read ids in `DatasetReader.reads` selection could return valid read records.
- Fixed bug in CI where the python venv was not activated resulting in incorrect conan version being used.

## [0.3.36]

### Added

- Added missing licence files.

### Removed

- Removed Python 3.9 and macOS 10.15 support since they're EOL.

## [0.3.35]

### Added

- Python 3.14 support

### Removed

- Removed sphinx-style python docstrings references
- Removed most documentation as part of migration to <https://software-docs.nanoporetech.com/pod5>
- Deprecated `--duplicate-ok` argument from pod5 tools - duplicating reads is now always invalid.

### Changed

- Moved filter + subset implementation into C++ for improved performance.
- Performance improvements to `pod5 view` especially when reading read ids from large files.
- Updated polars version from "~=1.20,<1.32" to "~= 1.30"
- Switch to uv for managing CI python environments
- Updated to pyarrow 22.0.0

## [0.3.34]

### Added

- `open_pore_level` to `pod5 inspect read`

### Changed

- Fixed migration behaviour on nfs systems, where migrated tables could be left orphaned on disk.
- Limited polars install version to "~=1.20,<1.32" following breaking changes
- Tidied up how tmp files are named, used a larger set of numbers for naming.

## [0.3.33]

### Added

- Added Conan 2 CI

### Changed

- Reduced virtual memory usage when opening POD5 files by 75%.
- Python API now memory maps inner tables using the `mmap.mmap` `offset` and `length` arguments directly instead of taking a slice of the whole file.

## [0.3.32]

### Added

- Option to allow users of C++ API to not keep file handles open if required.

### Changed

- Order of `pod5 view` is backwards compatible with 0.3.30, new `open_pore_level` field is at the end of the list.

## [0.3.31]

### Added

- Added new field `open_pore_level`, containing the level of the open pore as tracked by MinKNOW for this channel/well.

### Removed

- Deprecated support for unused read scaling values "tracked_scaling_scale", "tracked_scaling_shift", "predicted_scaling_scale", "predicted_scaling_shift", "num_reads_since_mux_change" and "time_since_mux_change". These will be removed from stored data and writer API in 0.4.0, with accessing API remaining in place until 0.5.0.

## [0.3.30]

### Changed

- Build with sanitization on GCC13

### Removed

- Dropped incorrect sanitized conan jobs.

## [0.3.29]

### Removed

- Dropped support for macOS x86

## [0.3.28]

### Changed

- Additional testing for Linux file access.

## [0.3.27]

### Fixed

- Fixed some crashes when parsing corrupt POD5 files.
- Fixed missing error handling when the C API is called incorrectly.
- Fixed and clarified C API thread safety.
- Fall back to regular IO if direct IO is requested, but file opening fails.

### Removed

- Dropped automated ARM+GCC8 builds.

### Changed

- Bumped polars to next major version (`~= 1.20`).

## [0.3.26]

### Changed

- The read end reason now includes paused - for reads that ended because acquisition was paused.

## [0.3.25]

### Changed

- Python 3.8 wheels are no longer built for Windows or macOS (Python 3.8 is end-of-life).
- Better error messages and testing of file recovery.

### Added

- Conan pod5 builds with address, thread and undefined behaviour sanitizer support.
- Added fuzz testing.
- New option to clean up temporary files after file recovery.

## [0.3.24]

### Changed

- Update to arrow 18 for the cpp library.

### Fixed

- Flush `pod5 view` header to prevent issue on Windows systems where header would not be on top.

## [0.3.23]

### Changed

- Removed use of python `build` when building wheel in cmake.

## [0.3.22]

### Added

- `ArrowTableHandle` `stream` member to store the `BatchFileReader` backend
- `ArrowTableHandle` `options` argument to pass in `IpcReadOptions`
- `pod5::default_memory_pool` function which selects an appropriate memory pool even on large page systems.

### Changed

- Refactored Multi-threading in `DatasetReader` to prevent too many open files errors
- Updated dependency to `pyarrow~=18.0.0` for `python>=3.9`
- Relaxed h5py python dependency

## [0.3.21]

### Added

- Support for python 3.13.

### Changed

- Removed use of Boost. This does not affect the C interface, but may require changes to
  consumers of the C++ headers.

## [0.3.20]

### Changed

- Refactored directio writing engine to open up async io support.
- Fixed Boost version compatibility checking in Conan packages.

## [0.3.19]

### Added

- New end reason for reads terminated due to an analysis configuration change.

### Changed

- Reduced allocations when compressing signal.

### Fixed

- Crash when searching empty file for reads.

## [0.3.18]

### Added

- Ability to disable flushing on batch complete
- Use new LinuxOutputStream to cache allocations and reduce memory when writing many files.

## [0.3.17]

### Changed

- Move svb headers to the correct subdirectory.

## [0.3.16]

### Added

- svb16 headers packaged with pod5

### Changed

- Directio output now writes on batch complete without flushing explicitly.

## [0.3.15]

### Added

- Added new end reasons "api_request" and "device_data_error" to support new read end reasons that future MinKNOW versions will generate.
- Allow directio to specify the chunk size directly.

## [0.3.14]

### Added

- gcc8 builds

## [0.3.13]

### Fixed

- Instability when creating a pod5 writer fails.
- Issue with directio mode where space is over reserved.

## [0.3.12]

### Fixed

- Fixed issues reading signal from uncompressed pod5 files.

## [0.3.11]

### Added

- Typechecking on `Writer.add_reads` to inform users incorrectly passing `ReadRecords`
- Compatibility with numpy 2.0.

### Fixed

- `DatasetReader` correctly handles string paths

## [0.3.10]

### Added

- Required pypa project metadata.

### Removed

- Dropped support for OSX builds for XCode < 14.2.

## [0.3.9]

### Fixed

- `ReadRecord.to_read()` missing fields

## [0.3.8]

### Fixed

- Conan windows upload jobs failure due to using different line endings.

## [0.3.7]

### Fixed

- CI package uploading to PyPi following [API token migration](https://pypi.org/help/#apitoken).
- Documentation for some functions.
- Explicitly sized type in `pod5_vbz_decompress_signal()`.
- CI execution of tests.

### Changed

- Updated `pre-commit` to `clang-format-17`.
- Updated Arrow to 12.0.0.

## [0.3.6]

### Fixed

- Polars `ColumnNotFoundError: not_set` introduced by `polars==0.20.0`

## [0.3.5]

### Fixed

- Arrow build flags in conanfile are now configured in the `configure()` function rather than being default options.

## [0.3.4]

### Added

- boost_internal_build flag in conanfile.
- CI now builds with the above flag turned on.

## [0.3.3]

### Added

- CI for appleclang 14
- cppstd builds

## [0.3.2]

### Added

- Support for Python 3.12

## [0.3.1] 2023-11-10

### Fixed

- Logging no longer calls `basicConfig` which may unintentionally edit users logging configuration

## [0.3.0] 2023-11-07

### Changed

- Transfers dataframes used in subsetting / filter use categorical fields to reduce memory consumption
- Polars version increased to `~=0.19`
- Documentation regarding positional arguments
- Renamed deprecated `polars.groupby` to `polars.group_by`

### Fixed

- Fixed a bug in the build scripts that prevented iOS and Windows Conan packages from being uploaded.
- Remove exposed artifactory URL env var from gitlab ci config.
- `convert to_fast5` writes byte encoded read_ids to match MinKNOW (was `str`)

### Removed

- Removed python3.7 support

## [0.2.9] 2023-11-02

### Fixed

- Corrected the visibility of dependencies when building pod5 as a shared library.

## [0.2.8] 2023-11-01

### Added

- Added compression status to `pod5 inspect summary <file>`
- Added environment override "POD5_DISABLE_MMAP_OPEN" to force non-mmapped opening of files.

### Fixed

- Remove exposed artifactory URL env var from gitlab ci config.
- `convert to_fast5` writes byte encoded read_ids to match MinKNOW (was `str`)

## [0.2.7] 2023-09-11

### Added

- `DatasetReader` class for reading collections of pod5 files
- Return index errors when querying invalid errors from API's

### Changed

- Recursive search for files now traverses symbolic links and ignores hidden files
- Tweak block size of directio writes to 1MB.

## [0.2.6] 2023-09-04

### Changed

- Write pod5 files using DirectIO on Linux platforms (performance)

## [0.2.5] 2023-08-01

### Added

- Shared builds to conan

### Fixed

- `num_minknow_events` field description from `int8` to `uint64`
- `ReadRecord.num_minknow_events` return type-hint from `float` to `int`

## [0.2.4] 2023-07-13

### Changed

- Increased `numpy` minimum version to `>= 1.21.0`
- Improved performance of `subset`, `filter` and `merge` tools.
- `Repacker.wait` and `Repacker.waiter` parameters

### Deprecated

- Some parameters of `Repacker.wait` and `Repacker.waiter` are deprecated and issue `FutureWarning`

### Fixed

- `Repacker.is_complete` returning `True` when work is queued.

## [0.2.3] 2023-06-26

### Added

- Add API (pod5_open_file_options) to prevent pod5 from opening a file using mmap, instead using direct file IO.
- Default field values (empty string) when converting fast5 files with missing fields

### Changed

- Corrected Oxford Nanopore Technologies company name in package metadata to use Public Limited Company (Plc) instead of Limited (Ltd)
- Limited the number of processes created when specifying `--threads` to the number of cpu cores available `os.cpu_count()`
- Reduced the default value for `--threads` from 8 to 4 to improve stability on resource constrained systems

## [0.2.2] 2023-06-06

### Fixed

- Add API error when adding reads with invalid end reason, pore type or run info.

## [0.2.1] 2023-05-25

### Changed

- Update internal arrow lib to not export flatbuffers symbols.

## [0.2.0] 2023-05-18

### Added

- `pod5 view` tool to view / inspect pod5 files as tables. Gives a >200x speed improvement compared to `pod5 inspect reads`
- `pod5 recover` tool to recover data from corrupted / truncated pod5 files
- `pod5 update` documentation
- source distributions to pypi

### Changed

- `pod5 subset` and `pod5 filter` uses `polars` to parse inputs
- `pod5 subset` and `pod5 filter` csv formatting requirements tightened
- `pod5` tools which use multiple pod5 file inputs now accept directories which can be searched recursively with `-r/--recursive`
- `pod5 subset` `--read-id-column` argument abbreviation `-r` changed to `-R` to allow `-r/--recursive` to be consistent for all tools
- `pod5` tools use hyphens in all arguments (e.g. `--force-overwrite` and `--read-id-column`)
- `pod5 merge` and `pod5 update` uses named `-o/--output` argument instead of positional `output` argument to standardise tools
- `pod5 update` progress bar and better detection of name conflicts
- Minimised number of open file handles in tools to prevent `Too many open files` error
- Logging added to `merge`, `filter` and `subset`. Enabled with `POD5_DEBUG=1`

### Deprecated

- `pod5 inspect reads` deprecated in favour of `pod5 view`

### Fixed

- Exception raised when calling `pod5` without any arguments
- Exception raised in `pod5 convert fast5` where closed writers were reopened after being closed by a caught exception
- Fixed Gitlab 38, pod5_get_end_reason and pod5_get_pore_type ignoring input string length checks.

### Removed

- `pod5 subset` `--json` mapping arguments
- `pod5 merge` `--chunk-size` argument
- `ReadTableVersion` replaced with an integer value

## [0.1.21] 2023-04-27

### Fixed

- Repacker `reads_completed` value while copying a selection of reads.
- Fixed crash when trying to load files with a bad footer.

## [0.1.20] 2023-04-20

### Fixed

- Fixed merging many files exceeding the size limit of dictionary indices.

## [0.1.19] 2023-04-14

### Changed

- `pod5 convert fast5` now creates logs when `POD5_DEBUG=1` set
- `pod5 convert fast5` checks multi-read fast5s at conversion time

### Fixed

- Fixed memory usage growth over time as signal was loaded with large pod5 files.
- Fixed crash loading malicious files (found via fuzz testing)
- Fixed leaks and UB when running unit tests.
- Fixed run-away memory consumption during fast5 conversion

## [0.1.17] 2023-04-06

### Changed

- Updated internal arrow version to 8.0.0.3

## [0.1.16] 2023-04-06

### Fixed

- Fixed issue where pod5 would read out of bounds memory when decompressing some reads.

## [0.1.15] 2023-03-31

### Changed

- Refactored `pod5 convert fast5` to use `concurrent.futures` only.
- Add further info to error message when signal cannot be decompressed by zstd
- Make merge operation not generate multiple identical run infos.

### Fixed

- Fixed closing uninitialised file handles.
- Fixed `pod5 inspect reads` repeating header
- Fixed a crash with certain pod5 search operations.

## [0.1.13] 2023-03-23

### Fixed

- Fix loading large pod5 files on virtual-memory limited systems.

## [0.1.12] 2023-03-20

### Added

- Added `--output` argument to `pod5 convert fast5` and `to_fast5` replacing positional argument of the same name
- Added `--strict` argument to `pod5 convert fast5` to promptly stop on exceptions
- Added readthedocs documentation links in README.md

### Changed

- Updated developer installation instructions to use `conan<2`
- Reworked `pod5 convert fast5` to tolerate runtime exceptions
- Use same type `run_info_index_t` for `pod5_get_file_run_info_count` and `pod5_get_file_run_info`.

### Fixed

- Fixed file handle leak in repacker

## [0.1.11] 2023-03-13

### Added

- Python API supports python 3.11
- Added missing python API wheels on windows

### Changed

- Changed python API dependency version `pyarrow~=11.0.0` from `8.0.0` to support python 3.11
- Changed python API dependency version `hdf5~=8.0.0` from `v7.0.0` to support python 3.11

## [0.1.10] 2023-03-09

### Added

- Added `pod5_get_read_count` to find the count of all reads in file
- Added `pod5_get_read_ids` to retrieve all read id's in file
- Added `pod5_get_file_run_info` to retrieve a run info at an absolute index in the file
- Added `pod5_free_run_info` to free run info's (replaces `pod5_release_run_info`)
- Added `pod5_get_file_run_info_count` to find the number of run info's in a file
- Added `pod5 filter` tool to subset pod5 files with simple list of read ids
- Added `tqdm` progress bar to `pod5 subset` (disable with `POD5_PBAR=0`)

### Changed

- Reworked `pod5 subset` to give better control over resources used
- `pod5 subset` can now parse csv and tsv tables / summaries
- `pod5 repack` now repacks all inputs one-to-one

### Deprecated

- Deprecated `pod5_release_run_info` (see `pod5_free_run_info`)

### Removed

- Removed filepath header line from `pod5 inspect reads`

## [0.1.9] 2023-03-07

### Added

- Added version attributes to `lib-pod5`

### Changed

- Versioning now controlled by VCS inspection using `setuptools_scm`

## [0.1.8] 2023-02-23

### Added

- Added more `read_id` getter methods to `Reader`
- Added support for python 3.8 + 3.10 on windows
- Added gcc7 linux build of pod5

### Changed

- Update to zlib 1.2.13
- Update to zstd 1.5.4
- Pinned `pre-commit=v2.21.0` while supporting `python3.7`
- Reworked `pod5 convert to_fast5` output filenames to allow for `1-1` mapping

### Fixed

- Fixed `pod5 inspect read`
- Fixed `pod5 convert to_fast5` creating an empty fast5 output
- Fixed `pod5 convert to_fast5` ignoring the `--force_overwrite` argument
- Fixed issue where thread_pool.h wasn't shipped.

## [0.1.5] - 2023-01-20

### Added

- Explicitly re-exported `lib-pod5` public symbols and added `py.typed` marker file to support type-checking.

### Fixed

- Fixed issue where closing many pod5 files in sequence is slow.
- Fixed incorrect python types and adopted python type-checking.

## [0.1.4] - 2022-12-22

### Added

- Linux python 3.11 wheels
- ReadTheDocs documentation support

### Fixed

- OSX arm64 wheel naming corrections - works with wider set of python executables

## [0.1.3] - 2022-12-16

### Added

- Added `Reader.__iter__` method.

### Changed

- Renamed `EndReason.name` to `EndReason.reason` to access the inner enum and added
  `EndReason.name` as a property to return the string representation of this enum value.
- `BaseRead`, `Read`, `CompressedRead`, `Calibration` and `Pore` dataclasses are now mutable.

### Removed

- Removed deprecated `Writer` functions.

### Fixed

- Fixed osx arm64 wheel compatibility for older python versions.
- Fixed EndReason type errors.
- Fixed EndReason in pod5 to fast5 conversion.

## [0.1.2] - 2022-12-06

### Changed

- Optimised the file writing utilities

## [0.1.1] - 2022-12-06

### Changed

- Restricted exported boost dependencies of conan package to just the boost::headers component.

## [0.1] - 2022-12-02

### Changed

- Documentation edits
- `Writer.add_reads` now handles both `Read` and `CompressedRead`.

### Deprecated

- Deprecated `Writer` methods `add_read_object` and `add_read_objects` for `add_read` and `add_reads` respectively.

### Removed

- Removed direct pod5 tool scripts.

### Fixed

- Fixed name of internal utils - "pad_file".
- Fixed spelling of various internal variables.
- Fixed `pod5 convert to_fast5`

## [0.0.43]

### Changed

- Reformat c++ code with more consistent format file.

## [0.0.42]

### Added

- Added `pod5` tools entry-point
- Added api to query file version information as written on disk.

### Changed

- Fixed signal_chunk_size type error in convert-from-fast5
- Replaced `ont_fast5_api` dependency with `vbz_h5py_plugin`
- Restructured Python packaging to include `lib_pod5_format` which contains the native bindings build from pybind11.
- `pod5_format` and `pod5_format_tools` are now pure python packages which depend on `lib_pod5_format`
- Python packages `pod5_format` and `pod5_format_tools` have been merged into single `pod5` pure-python package.
- `pod5-convert-from-fast5` `--output-one-to-one` reworked so that output files maintain the input structure making this argument more flexible and avoid filename clobbering.
- Added missing `lib_pod5.update_file` function to pyi.
- `pod5-convert-from-fast5` `output` now takes existing directories and
  writes `output.pod5` (current behaviour) or creates a new file with the given name if it doesn't exist.
- Renamed arguments in tools relating to multi-processing / multi-threading from `-p/--processes` to the more common `-t/--threads`.

## [0.0.41] - 2022-10-27

### Changed

- Fixed pod5-inspect erroring when loading data.
- Fixed issue where some files in between 0.34 - 0.38 wouldn't load correctly.

## [0.0.40] - 2022-10-27

### Changed

- Fixed migrating of large files from older versions.

## [0.0.39] - 2022-10-18

### Changed

- Fixed building against the c++ api - previously missing include files.

## [0.0.38] - 2022-10-18

### Changed

- All data in the read table that was previously contained in dictionaries of structs is now stored in the read table, or a new "run info" table.
  This change simplifies data access into the pod5 files, and helps users who want to convert the pod5 data to pandas or other arrow-compatible reader formats.
  Old data is migrated on load, and will continue to work, data can be permanently migrated using the tool `pod5-migrate`

### Removed

- Support for opening and writing "split" pod5 files. All API's now expect and return combined pod5 files.

## [0.0.37] - 2022-10-18

### Changed

- Updated Conan recipe to support building without specifying C++ standard version.

## [0.0.36] - 2022-10-07

### Changed

- Bump the Boost and Arrow versions to pick up latest changes.

## [0.0.35] - 2022-10-07

### Changed

- Support C++17 + C++20 with the conan package pod5 generates.

## [0.0.34] - 2022-10-05

### Changed

- Modified `pod5_format_tools/pod5_convert_to_fast5.py` to separate `pod5_convert_to_fast5_argparser()` and `convert_from_fast5()` out from `pod5_convert_from_fast5.main()`.

## [0.0.33] - 2022-10-05

### Added

- Added `num_samples` field to read table, containing the total number of samples a read contains. The field is filled in by API if it doesn't exist.

### Changed

- File version is now V2, due to the addition of `num_samples`.

## [0.0.32] - 2022-10-03

### Fixed

- Fixed an issue where multi-threaded access to a single batch could cause a crash discovered by dorado testing.
- Fixed help text in convert to fast5 script.


================================================
FILE: CMakeLists.txt
================================================
# Top-level build script for the POD5 project.
cmake_minimum_required(VERSION 3.18.0)

project(POD5)

# Pull in the version helper; POD5_NUMERIC_VERSION is read from it just below.
include(${PROJECT_SOURCE_DIR}/cmake/POD5Version.cmake)

set(CMAKE_PROJECT_VERSION ${POD5_NUMERIC_VERSION})

# Let include()/find_package() locate modules shipped in the project's cmake/ directory.
set(CMAKE_MODULE_PATH ${CMAKE_MODULE_PATH} "${PROJECT_SOURCE_DIR}/cmake")

# Route C and C++ compilation through ccache when it can be found,
# unless the user explicitly opts out with DISABLE_CCACHE.
option(DISABLE_CCACHE "Do not try to use ccache to speed compilation" NO)
if (NOT DISABLE_CCACHE)
    find_program(CCACHE_EXECUTABLE ccache HINTS "C:/Program\ Files/ccache/")
    if (CCACHE_EXECUTABLE)
        message(STATUS "Using ccache: ${CCACHE_EXECUTABLE}")
        # Same launcher for both languages.
        foreach (launcher_lang CXX C)
            set(CMAKE_${launcher_lang}_COMPILER_LAUNCHER "${CCACHE_EXECUTABLE}")
        endforeach()
    endif()
endif()

# User-facing build options.
#
# Options wrapped in `if (NOT DEFINED ...)` are only declared when the variable
# has not already been defined, so a value supplied before this point is left
# untouched.

# Use conan to install dependencies.
if (NOT DEFINED ENABLE_CONAN)
    option(ENABLE_CONAN "Enable conan for dependency installation" OFF)
endif()

# Temporary switch while the project migrates to conan2 (see help text).
if (NOT DEFINED CONAN2)
    option(CONAN2 "Temp flag until we fully migrate to conan2" OFF)
endif()

option(BUILD_SHARED_LIB "Build a shared library" OFF)

# NOTE(review): POD5_DISABLE_TESTS defaults to ON, so test-related targets gated
# on `NOT POD5_DISABLE_TESTS` are skipped unless it is explicitly turned OFF —
# confirm this default is intended.
option(POD5_DISABLE_TESTS "Disable building all tests" ON)
option(POD5_BUILD_EXAMPLES "Enable building all examples" OFF)

# When ON, -fsanitize=address is added to compile and link options further down.
option(ENABLE_ADDRESS_SANITIZER "Enable address sanitizer" OFF)

# When ON, the pod5_packaging module is included at the end of this file.
if (NOT DEFINED ENABLE_POD5_PACKAGING)
    option(ENABLE_POD5_PACKAGING "Enable packaging support" ON)
endif()

# When ON, Python and the bundled pybind11 are pulled into the build.
option(BUILD_PYTHON_WHEEL "Build a python wheel for pod5" OFF)

# Debug symbols don't depend on the build type, only on this option.
# They are emitted for every configuration unless DISABLE_DEBUG_SYMBOLS is ON.
option(DISABLE_DEBUG_SYMBOLS "Force debug symbols to be disabled" OFF)
if (NOT DISABLE_DEBUG_SYMBOLS)
    if (MSVC)
        # Z7 embeds debugging info into .obj files, which is easier to manage for
        # build accelerators (note that a .pdb will still be generated for libs)
        # https://docs.microsoft.com/en-us/cpp/build/reference/z7-zi-zi-debug-information-format
        add_compile_options(/Z7)
        # this will use fastlink in the IDE and full link from the command line
        # https://docs.microsoft.com/en-us/cpp/build/reference/debug-generate-debug-info
        #
        # Each linker-flag variable is extended from its OWN previous value, so
        # flags already set for module/shared links are preserved and /DEBUG is
        # appended exactly once to each.
        set(CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} /DEBUG")
        set(CMAKE_MODULE_LINKER_FLAGS "${CMAKE_MODULE_LINKER_FLAGS} /DEBUG")
        set(CMAKE_SHARED_LINKER_FLAGS "${CMAKE_SHARED_LINKER_FLAGS} /DEBUG")
        # /DEBUG option is not recognised for STATIC lib linking
    elseif (CMAKE_COMPILER_IS_GNUCXX OR CMAKE_CXX_COMPILER_ID MATCHES "Clang")
        add_compile_options(-g)
    endif()
endif()

# Fuzzing support is opt-in. POD5_ENABLE_FUZZERS is always defined for the
# compiler (as 0 or 1) so sources can test it regardless of the setting.
option(ENABLE_FUZZERS "Build the fuzzers that can be used to catch new issues" OFF)
if (ENABLE_FUZZERS)
    include(pod5_fuzz)
endif()
add_compile_definitions(POD5_ENABLE_FUZZERS=$<BOOL:${ENABLE_FUZZERS}>)

# Coverage instrumentation is opt-in and has several preconditions.
option(ENABLE_COVERAGE_REPORT "Executables emit coverage reports" OFF)
if (ENABLE_COVERAGE_REPORT)
    # message(FATAL_ERROR ...) aborts configuration, so each precondition is
    # written as a standalone guard; only the first failing one is reported.
    if (DISABLE_DEBUG_SYMBOLS)
        message(FATAL_ERROR "Debug symbols are required for coverage reports to work")
    endif()
    if (NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
        message(FATAL_ERROR "Only unoptimised builds give reliable coverage reports")
    endif()
    if (NOT CMAKE_CXX_COMPILER_ID MATCHES "(GNU|Clang)")
        message(FATAL_ERROR "Cannot enable coverage on unknown compiler")
    endif()

    # All preconditions hold: instrument both compilation and linking.
    add_compile_options(--coverage)
    add_link_options(--coverage)
endif()


# FIXME: DISABLE CONDITIONAL TO WORK ON BIONIC
# Pin the libstdc++ ABI for conan builds with GCC 9.x (>= 9.0 and < 10.0).
if (ENABLE_CONAN AND CMAKE_COMPILER_IS_GNUCXX)
    if (CMAKE_CXX_COMPILER_VERSION VERSION_GREATER_EQUAL "9.0" AND
            CMAKE_CXX_COMPILER_VERSION VERSION_LESS "10.0")
        # POD5 is built on CentOS 7 in CI, which has GCC 9 but only the
        # pre-C++11 ABI.
        # See https://gcc.gnu.org/onlinedocs/libstdc++/manual/using_dual_abi.html
        # Forcing the old ABI for GCC 9 on other platforms (eg: Ubuntu Focal)
        # keeps them compatible, so the same conan packages can be used.
        add_compile_definitions(_GLIBCXX_USE_CXX11_ABI=0)
    endif()
endif()

# AddressSanitizer must be enabled for both the compile and the link step.
if (ENABLE_ADDRESS_SANITIZER)
    add_compile_options("-fsanitize=address")
    add_link_options("-fsanitize=address")
endif()

# Headers bundled under third_party/include are visible to every target.
include_directories("third_party/include")

# Place build products in per-configuration trees under the binary directory:
#   <build>/<Config>/lib for archives and libraries,
#   <build>/<Config>/bin for runtime artifacts.
foreach (config "Release" "Debug")
    string(TOUPPER "${config}" config_upper)
    foreach (lib_kind ARCHIVE LIBRARY)
        set(CMAKE_${lib_kind}_OUTPUT_DIRECTORY_${config_upper} ${CMAKE_BINARY_DIR}/${config}/lib)
    endforeach()
    set(CMAKE_RUNTIME_OUTPUT_DIRECTORY_${config_upper} ${CMAKE_BINARY_DIR}/${config}/bin)
endforeach()

# install() rules that do not name a component fall into "archive".
set(CMAKE_INSTALL_DEFAULT_COMPONENT_NAME "archive")

include(GenerateExportHeader)

enable_testing()

# Python wheel builds need an exact Python version plus the bundled pybind11.
if (BUILD_PYTHON_WHEEL)
    find_package(Python ${PYTHON_VERSION} EXACT COMPONENTS Interpreter Development)
    # Ask pybind11 to use the FindPython-based discovery performed above.
    set(PYBIND11_FINDPYTHON ON)
    add_subdirectory(third_party/pybind11)
    # Ship pybind11's license next to the other licenses.
    install(
        FILES third_party/pybind11/LICENSE
        DESTINATION licenses
        RENAME pybind11.txt
    )
endif()

# Main C++ sources.
add_subdirectory(c++)

# The fuzz directory contains both the fuzzers and the regression runners,
# the latter of which can be built as ordinary tests.
# It is therefore added when either fuzzers are enabled or tests are not disabled.
if (ENABLE_FUZZERS OR NOT POD5_DISABLE_TESTS)
    add_subdirectory(fuzz)
endif()

# Install licenses.
# The trailing slash installs the directory's contents rather than the directory
# itself. NOTE(review): pod5_conan_licenses is presumably populated by the conan
# dependency step — not visible in this file; confirm.
install(
    DIRECTORY ${CMAKE_BINARY_DIR}/pod5_conan_licenses/
    DESTINATION licenses
)
# The project's own license plus the license of the bundled gsl-lite.
install(
    FILES
        LICENSE.md
        third_party/licenses/gsl-lite.txt
    DESTINATION
        licenses
)

# Packaging rules live in the pod5_packaging module, resolved via CMAKE_MODULE_PATH.
if (ENABLE_POD5_PACKAGING)
    include(pod5_packaging)
endif()


================================================
FILE: CMakePresets.json
================================================
{
    "version": 4,
    "include": [
        "cmake/presets/conan-provider.json",
        "cmake/presets/conan-build-options.json",
        "cmake/presets/conan-profiles.json"
    ],
    "configurePresets": [
        {
            "name": "conan2-linux-gcc9-x86_64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc9-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc9-x86_64-cppstd20-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc9-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc9-x86_64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc9-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc9-x86_64-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc9-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc13-x86_64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc13-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc13-x86_64-cppstd20-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc13-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc13-x86_64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc13-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc13-x86_64-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc13-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-x86_64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-x86_64-cppstd20-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-x86_64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-x86_64-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-asan-static-x86_64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-asan-static-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-asan-static-x86_64-cppstd20-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-asan-static-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-usan-static-x86_64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-usan-static-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-usan-static-x86_64-cppstd20-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-usan-static-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-tsan-static-x86_64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-tsan-static-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-tsan-static-x86_64-cppstd20-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-tsan-static-x86_64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-asan-static-x86_64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-asan-static-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-asan-static-x86_64-cppstd17-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-asan-static-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-usan-static-x86_64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-usan-static-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-usan-static-x86_64-cppstd17-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-usan-static-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-tsan-static-x86_64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-tsan-static-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-tsan-static-x86_64-cppstd17-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-tsan-static-x86_64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc13-aarch64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc13-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc13-aarch64-cppstd20-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc13-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc13-aarch64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc13-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc13-aarch64-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc13-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-aarch64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-aarch64-cppstd20-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc11-aarch64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc11-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc11-aarch64-cppstd17-release",
            "hidden": false,
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc11-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc9-aarch64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc9-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc9-aarch64-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc9-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-linux-gcc9-aarch64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-gcc9-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-linux-gcc9-aarch64-cppstd20-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-gcc9-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-macos-appleclang-15.0-aarch64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-appleclang-15.0-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-macos-appleclang-15.0-aarch64-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-appleclang-15.0-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-macos-appleclang-15.0-aarch64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-appleclang-15.0-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-macos-appleclang-15.0-aarch64-cppstd20-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-appleclang-15.0-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-macos-appleclang-16.0-aarch64-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-appleclang-16.0-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-macos-appleclang-16.0-aarch64-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-appleclang-16.0-aarch64-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-macos-appleclang-16.0-aarch64-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-appleclang-16.0-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-macos-appleclang-16.0-aarch64-cppstd20-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-appleclang-16.0-aarch64-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-windows-x86_64-vs2019-cppstd17-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-windows-x86_64-vs2019-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-windows-x86_64-vs2019-cppstd17-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-windows-x86_64-vs2019-profile",
                "conan2-cppstd17"
            ]
        },
        {
            "name": "conan2-windows-x86_64-vs2019-cppstd20-debug",
            "inherits": [
                "conan2-provider",
                "conan2-debug",
                "conan2-windows-x86_64-vs2019-profile",
                "conan2-cppstd20"
            ]
        },
        {
            "name": "conan2-windows-x86_64-vs2019-cppstd20-release",
            "inherits": [
                "conan2-provider",
                "conan2-release",
                "conan2-windows-x86_64-vs2019-profile",
                "conan2-cppstd20"
            ]
        }
    ]
}


================================================
FILE: DEV.md
================================================
Development
===========

If you want to contribute to pod5_file_format, or our pre-built binaries do not meet your platform requirements, you can build pod5 from source using the instructions in `docs/install.rst`.

### Developing

Building the project requires that several tools and libraries are available:

- CMake
- Arrow
- Zstd
- Flatbuffers
- Python
- setuptools_scm

```bash
# Docs on installing arrow from here: https://arrow.apache.org/install/
> sudo apt install -y -V ca-certificates lsb-release wget
> wget https://apache.jfrog.io/artifactory/arrow/$(lsb_release --id --short | tr 'A-Z' 'a-z')/apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
> sudo apt install -y -V ./apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
> sudo apt update
# Now install the rest of the dependencies:
> sudo apt install cmake libzstd-dev libflatbuffers-dev libarrow-dev=12.0.1-1
> pip install setuptools_scm~=7.1
# Finally start build of POD5:
> git clone https://github.com/nanoporetech/pod5-file-format.git
> cd pod5-file-format
> git submodule update --init --recursive
> python -m setuptools_scm
> python ./pod5_make_version.py
> mkdir build
> cd build
> cmake ..
> make -j
```

### Pre commit

The project uses pre-commit to ensure code is consistently formatted. You can set this up using pip:

```bash
> pip install pre-commit==v2.21.0
# Install pre-commit hooks in your pod5-file-format repo:
> cd pod5-file-format
> pre-commit install
# Run hooks on all files:
> pre-commit run --all-files
```

Python Development
==================

After completing the required build stages above, follow the instructions below to create a Python virtual environment for development.

```bash

> cd python
> make install

```


================================================
FILE: LICENSE.md
================================================
This Source Code Form is subject to the terms of the Mozilla Public
License, v. 2.0. If a copy of the MPL was not distributed with this
file, You can obtain one at https://mozilla.org/MPL/2.0/.

©2021 Oxford Nanopore Technologies PLC.


Mozilla Public License Version 2.0
==================================

### 1. Definitions

**1.1. “Contributor”**
    means each individual or legal entity that creates, contributes to
    the creation of, or owns Covered Software.

**1.2. “Contributor Version”**
    means the combination of the Contributions of others (if any) used
    by a Contributor and that particular Contributor's Contribution.

**1.3. “Contribution”**
    means Covered Software of a particular Contributor.

**1.4. “Covered Software”**
    means Source Code Form to which the initial Contributor has attached
    the notice in Exhibit A, the Executable Form of such Source Code
    Form, and Modifications of such Source Code Form, in each case
    including portions thereof.

**1.5. “Incompatible With Secondary Licenses”**
    means

* **(a)** that the initial Contributor has attached the notice described
    in Exhibit B to the Covered Software; or
* **(b)** that the Covered Software was made available under the terms of
    version 1.1 or earlier of the License, but not also under the
    terms of a Secondary License.

**1.6. “Executable Form”**
    means any form of the work other than Source Code Form.

**1.7. “Larger Work”**
    means a work that combines Covered Software with other material, in
    a separate file or files, that is not Covered Software.

**1.8. “License”**
    means this document.

**1.9. “Licensable”**
    means having the right to grant, to the maximum extent possible,
    whether at the time of the initial grant or subsequently, any and
    all of the rights conveyed by this License.

**1.10. “Modifications”**
    means any of the following:

* **(a)** any file in Source Code Form that results from an addition to,
    deletion from, or modification of the contents of Covered
    Software; or
* **(b)** any new file in Source Code Form that contains any Covered
    Software.

**1.11. “Patent Claims” of a Contributor**
    means any patent claim(s), including without limitation, method,
    process, and apparatus claims, in any patent Licensable by such
    Contributor that would be infringed, but for the grant of the
    License, by the making, using, selling, offering for sale, having
    made, import, or transfer of either its Contributions or its
    Contributor Version.

**1.12. “Secondary License”**
    means either the GNU General Public License, Version 2.0, the GNU
    Lesser General Public License, Version 2.1, the GNU Affero General
    Public License, Version 3.0, or any later versions of those
    licenses.

**1.13. “Source Code Form”**
    means the form of the work preferred for making modifications.

**1.14. “You” (or “Your”)**
    means an individual or a legal entity exercising rights under this
    License. For legal entities, “You” includes any entity that
    controls, is controlled by, or is under common control with You. For
    purposes of this definition, “control” means **(a)** the power, direct
    or indirect, to cause the direction or management of such entity,
    whether by contract or otherwise, or **(b)** ownership of more than
    fifty percent (50%) of the outstanding shares or beneficial
    ownership of such entity.


### 2. License Grants and Conditions

#### 2.1. Grants

Each Contributor hereby grants You a world-wide, royalty-free,
non-exclusive license:

* **(a)** under intellectual property rights (other than patent or trademark)
    Licensable by such Contributor to use, reproduce, make available,
    modify, display, perform, distribute, and otherwise exploit its
    Contributions, either on an unmodified basis, with Modifications, or
    as part of a Larger Work; and
* **(b)** under Patent Claims of such Contributor to make, use, sell, offer
    for sale, have made, import, and otherwise transfer either its
    Contributions or its Contributor Version.

#### 2.2. Effective Date

The licenses granted in Section 2.1 with respect to any Contribution
become effective for each Contribution on the date the Contributor first
distributes such Contribution.

#### 2.3. Limitations on Grant Scope

The licenses granted in this Section 2 are the only rights granted under
this License. No additional rights or licenses will be implied from the
distribution or licensing of Covered Software under this License.
Notwithstanding Section 2.1(b) above, no patent license is granted by a
Contributor:

* **(a)** for any code that a Contributor has removed from Covered Software;
    or
* **(b)** for infringements caused by: **(i)** Your and any other third party's
    modifications of Covered Software, or **(ii)** the combination of its
    Contributions with other software (except as part of its Contributor
    Version); or
* **(c)** under Patent Claims infringed by Covered Software in the absence of
    its Contributions.

This License does not grant any rights in the trademarks, service marks,
or logos of any Contributor (except as may be necessary to comply with
the notice requirements in Section 3.4).

#### 2.4. Subsequent Licenses

No Contributor makes additional grants as a result of Your choice to
distribute the Covered Software under a subsequent version of this
License (see Section 10.2) or under the terms of a Secondary License (if
permitted under the terms of Section 3.3).

#### 2.5. Representation

Each Contributor represents that the Contributor believes its
Contributions are its original creation(s) or it has sufficient rights
to grant the rights to its Contributions conveyed by this License.

#### 2.6. Fair Use

This License is not intended to limit any rights You have under
applicable copyright doctrines of fair use, fair dealing, or other
equivalents.

#### 2.7. Conditions

Sections 3.1, 3.2, 3.3, and 3.4 are conditions of the licenses granted
in Section 2.1.


### 3. Responsibilities

#### 3.1. Distribution of Source Form

All distribution of Covered Software in Source Code Form, including any
Modifications that You create or to which You contribute, must be under
the terms of this License. You must inform recipients that the Source
Code Form of the Covered Software is governed by the terms of this
License, and how they can obtain a copy of this License. You may not
attempt to alter or restrict the recipients' rights in the Source Code
Form.

#### 3.2. Distribution of Executable Form

If You distribute Covered Software in Executable Form then:

* **(a)** such Covered Software must also be made available in Source Code
    Form, as described in Section 3.1, and You must inform recipients of
    the Executable Form how they can obtain a copy of such Source Code
    Form by reasonable means in a timely manner, at a charge no more
    than the cost of distribution to the recipient; and

* **(b)** You may distribute such Executable Form under the terms of this
    License, or sublicense it under different terms, provided that the
    license for the Executable Form does not attempt to limit or alter
    the recipients' rights in the Source Code Form under this License.

#### 3.3. Distribution of a Larger Work

You may create and distribute a Larger Work under terms of Your choice,
provided that You also comply with the requirements of this License for
the Covered Software. If the Larger Work is a combination of Covered
Software with a work governed by one or more Secondary Licenses, and the
Covered Software is not Incompatible With Secondary Licenses, this
License permits You to additionally distribute such Covered Software
under the terms of such Secondary License(s), so that the recipient of
the Larger Work may, at their option, further distribute the Covered
Software under the terms of either this License or such Secondary
License(s).

#### 3.4. Notices

You may not remove or alter the substance of any license notices
(including copyright notices, patent notices, disclaimers of warranty,
or limitations of liability) contained within the Source Code Form of
the Covered Software, except that You may alter any license notices to
the extent required to remedy known factual inaccuracies.

#### 3.5. Application of Additional Terms

You may choose to offer, and to charge a fee for, warranty, support,
indemnity or liability obligations to one or more recipients of Covered
Software. However, You may do so only on Your own behalf, and not on
behalf of any Contributor. You must make it absolutely clear that any
such warranty, support, indemnity, or liability obligation is offered by
You alone, and You hereby agree to indemnify every Contributor for any
liability incurred by such Contributor as a result of warranty, support,
indemnity or liability terms You offer. You may include additional
disclaimers of warranty and limitations of liability specific to any
jurisdiction.


### 4. Inability to Comply Due to Statute or Regulation

If it is impossible for You to comply with any of the terms of this
License with respect to some or all of the Covered Software due to
statute, judicial order, or regulation then You must: **(a)** comply with
the terms of this License to the maximum extent possible; and **(b)**
describe the limitations and the code they affect. Such description must
be placed in a text file included with all distributions of the Covered
Software under this License. Except to the extent prohibited by statute
or regulation, such description must be sufficiently detailed for a
recipient of ordinary skill to be able to understand it.


### 5. Termination

**5.1.** The rights granted under this License will terminate automatically
if You fail to comply with any of its terms. However, if You become
compliant, then the rights granted under this License from a particular
Contributor are reinstated **(a)** provisionally, unless and until such
Contributor explicitly and finally terminates Your grants, and **(b)** on an
ongoing basis, if such Contributor fails to notify You of the
non-compliance by some reasonable means prior to 60 days after You have
come back into compliance. Moreover, Your grants from a particular
Contributor are reinstated on an ongoing basis if such Contributor
notifies You of the non-compliance by some reasonable means, this is the
first time You have received notice of non-compliance with this License
from such Contributor, and You become compliant prior to 30 days after
Your receipt of the notice.

**5.2.** If You initiate litigation against any entity by asserting a patent
infringement claim (excluding declaratory judgment actions,
counter-claims, and cross-claims) alleging that a Contributor Version
directly or indirectly infringes any patent, then the rights granted to
You by any and all Contributors for the Covered Software under Section
2.1 of this License shall terminate.

**5.3.** In the event of termination under Sections 5.1 or 5.2 above, all
end user license agreements (excluding distributors and resellers) which
have been validly granted by You or Your distributors under this License
prior to termination shall survive termination.


### 6. Disclaimer of Warranty

> Covered Software is provided under this License on an “as is”
> basis, without warranty of any kind, either expressed, implied, or
> statutory, including, without limitation, warranties that the
> Covered Software is free of defects, merchantable, fit for a
> particular purpose or non-infringing. The entire risk as to the
> quality and performance of the Covered Software is with You.
> Should any Covered Software prove defective in any respect, You
> (not any Contributor) assume the cost of any necessary servicing,
> repair, or correction. This disclaimer of warranty constitutes an
> essential part of this License. No use of any Covered Software is
> authorized under this License except under this disclaimer.

### 7. Limitation of Liability

> Under no circumstances and under no legal theory, whether tort
> (including negligence), contract, or otherwise, shall any
> Contributor, or anyone who distributes Covered Software as
> permitted above, be liable to You for any direct, indirect,
> special, incidental, or consequential damages of any character
> including, without limitation, damages for lost profits, loss of
> goodwill, work stoppage, computer failure or malfunction, or any
> and all other commercial damages or losses, even if such party
> shall have been informed of the possibility of such damages. This
> limitation of liability shall not apply to liability for death or
> personal injury resulting from such party's negligence to the
> extent applicable law prohibits such limitation. Some
> jurisdictions do not allow the exclusion or limitation of
> incidental or consequential damages, so this exclusion and
> limitation may not apply to You.


### 8. Litigation

Any litigation relating to this License may be brought only in the
courts of a jurisdiction where the defendant maintains its principal
place of business and such litigation shall be governed by laws of that
jurisdiction, without reference to its conflict-of-law provisions.
Nothing in this Section shall prevent a party's ability to bring
cross-claims or counter-claims.


### 9. Miscellaneous

This License represents the complete agreement concerning the subject
matter hereof. If any provision of this License is held to be
unenforceable, such provision shall be reformed only to the extent
necessary to make it enforceable. Any law or regulation which provides
that the language of a contract shall be construed against the drafter
shall not be used to construe this License against a Contributor.


### 10. Versions of the License

#### 10.1. New Versions

Mozilla Foundation is the license steward. Except as provided in Section
10.3, no one other than the license steward has the right to modify or
publish new versions of this License. Each version will be given a
distinguishing version number.

#### 10.2. Effect of New Versions

You may distribute the Covered Software under the terms of the version
of the License under which You originally received the Covered Software,
or under the terms of any subsequent version published by the license
steward.

#### 10.3. Modified Versions

If you create software not governed by this License, and you want to
create a new license for such software, you may create and use a
modified version of this License if you rename the license and remove
any references to the name of the license steward (except to note that
such modified license differs from this License).

#### 10.4. Distributing Source Code Form that is Incompatible With Secondary Licenses

If You choose to distribute Source Code Form that is Incompatible With
Secondary Licenses under the terms of this version of the License, the
notice described in Exhibit B of this License must be attached.

## Exhibit A - Source Code Form License Notice

    This Source Code Form is subject to the terms of the Mozilla Public
    License, v. 2.0. If a copy of the MPL was not distributed with this
    file, You can obtain one at https://mozilla.org/MPL/2.0/.

If it is not possible or desirable to put the notice in a particular
file, then You may include the notice in a location (such as a LICENSE
file in a relevant directory) where a recipient would be likely to look
for such a notice.

You may add additional accurate notices of copyright ownership.

## Exhibit B - “Incompatible With Secondary Licenses” Notice

    This Source Code Form is "Incompatible With Secondary Licenses", as
    defined by the Mozilla Public License, v. 2.0.


================================================
FILE: README.md
================================================
[![Documentation Status](https://readthedocs.org/projects/pod5-file-format/badge/?version=latest)](https://pod5-file-format.readthedocs.io/)

POD5 File Format
================

POD5 is a file format for storing nanopore DNA data in an easily accessible way.
The format is able to be written in a streaming manner which allows a sequencing
instrument to directly write the format.

Data in POD5 is stored using [Apache Arrow](https://github.com/apache/arrow), allowing
users to consume data in many languages using standard tools.

What does this project contain
------------------------------

This project contains a core library for reading and writing POD5 data, and a toolkit for
accessing this data in other languages.

Documentation
-------------

Full documentation is found at https://pod5-file-format.readthedocs.io/


Usage
-----

POD5 is also bundled as a python module for easy use in scripts, a user can install using:

```bash
> pip install pod5
```

This python module provides the python library to write custom scripts against.

Please see [examples](./python/pod5/examples) for documentation on using the library.

The `pod5` package also provides [a selection of tools](./python/pod5/README.md).


Design
------

For information about the design of POD5, see the [docs](./docs/README.md).

Development
-----------

If you want to contribute to pod5_file_format, or our pre-built binaries do not meet your platform requirements, you can build pod5 from source using the instructions in [DEV.md](DEV.md).


================================================
FILE: benchmarks/.gitignore
================================================
*/outputs/
image/*.whl


================================================
FILE: benchmarks/README.md
================================================
POD5 Benchmarks
==============

Building the benchmark environment
----------------------------------

To run benchmarks you first have to build the docker environment to run them:

```bash
> ./build.sh
```


Running a benchmark
-------------------

To run a benchmark, use the helper script to start the docker image:

```bash
> ./run_benchmark.sh convert ./path-to-source-files/
```


Benchmarking Results
--------------------

    Note preliminary results

    Results run on:
        0.0.16 POD5
        pyslow5 dev branch (commit 2643310a)

    Benchmark numbers are produced using a GridION.

    Note the benchmarks are run using python APIs, more work is required on C benchmarks.


## PCR Dataset

On a PCR Zymo dataset (PAM50264), using 10.4.1 e8.2 data (`pcr_zymo/20220419_1706_2E_PAM50264_3c6f33f1`):

### File sizes

| pod5   | blow5   | fast5   |
|--------|---------|---------|
| 37G    | 37G     | 52G     |

### Timings

|                                     | pod5       | blow5      | fast5      |
|-------------------------------------|------------|------------|------------|
| convert                             | 197.5 secs | 241.4 secs | Not Run    |
| find all read ids                   | 10.1 secs  | 1.8 secs   | 5.2 secs   |
| find all samples                    | 22.3 secs  | 82.5 secs  | 520.6 secs |
| find selected read ids read number  | 1.1 secs   | 5.8 secs   | 387.1 secs |
| find selected read ids sample count | 1.5 secs   | 5.7 secs   | 417.8 secs |
| find selected read ids samples      | 5.3 secs   | 6.4 secs   | 465.6 secs |

```* Note blow5 convert times include the index + merge operation```


## InterARTIC Dataset

Dataset available at:
https://github.com/Psy-Fer/interARTIC

### File sizes

| pod5   | blow5   | fast5   |
|--------|---------|---------|
| 3.3G   | 3.4G    | 6.9G    |

### Timings

|                                     | pod5      | blow5     | fast5     |
|-------------------------------------|-----------|-----------|-----------|
| convert                             | 28.6 secs | 21.0 secs | Not Run   |
| find all read ids                   | 0.5 secs  | 0.5 secs  | 0.7 secs  |
| find all samples                    | 3.0 secs  | 8.0 secs  | 73.5 secs |
| find selected read ids read number  | 0.4 secs  | 1.3 secs  | 29.3 secs |
| find selected read ids sample count | 0.6 secs  | 1.3 secs  | 30.4 secs |
| find selected read ids samples      | 1.4 secs  | 1.3 secs  | 37.8 secs |

```* Note blow5 convert times include the index + merge operation```


================================================
FILE: benchmarks/build.sh
================================================
#!/bin/bash
# Builds the `pod5-benchmark-base` docker image from image/Dockerfile.base.

# Abort on command failure, on failure inside a pipeline, and on use of an
# unset variable.
set -o errexit -o pipefail -o nounset
# set -o xtrace

# Absolute path of the directory holding this script, so the build can be
# started from any working directory.
here=$( cd -- "$( dirname -- "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )

# The docker build context is the image/ directory next to this script.
cd "${here}/image/"
docker build -t pod5-benchmark-base -f Dockerfile.base .


================================================
FILE: benchmarks/convert/run_blow5.sh
================================================
#!/bin/bash
# Forwards both arguments to tools/fast5_to_single_blow5.sh (path relative to
# the current working directory).
#   $1: input directory
#   $2: output directory

src_dir="$1"
dest_dir="$2"

./tools/fast5_to_single_blow5.sh "${src_dir}" "${dest_dir}"


================================================
FILE: benchmarks/convert/run_pod5.sh
================================================
#!/bin/bash
# Runs `pod5 convert fast5` on the input directory, writing to the output
# directory.
#   $1: input directory
#   $2: output directory

src_dir="$1"
dest_dir="$2"

pod5 convert fast5 "${src_dir}" --output "${dest_dir}"


================================================
FILE: benchmarks/find_all_read_ids/run_blow5.sh
================================================
#!/bin/bash
# Runs tools/pyslow5_tests.py in `get_all_read_ids` mode over every *.blow5
# file found in <input_dir>/blow5.
#   $1: input directory (must contain a blow5/ subdirectory)
#   $2: output directory

src_dir="$1"
dest_dir="$2"

./tools/pyslow5_tests.py \
    "${src_dir}"/blow5/*.blow5 \
    "${dest_dir}" \
    get_all_read_ids


================================================
FILE: benchmarks/find_all_read_ids/run_fast5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_fast5.py on <input_dir>/fast5 with no extra options.
#   $1: input directory (must contain a fast5/ subdirectory)
#   $2: output directory

src_dir="$1"
dest_dir="$2"

./tools/find_and_get_fast5.py "${src_dir}/fast5" "${dest_dir}"


================================================
FILE: benchmarks/find_all_read_ids/run_pod5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_pod5.py on <input_dir>/pod5 with no extra options.
#   $1: input directory (must contain a pod5/ subdirectory)
#   $2: output directory

src_dir="$1"
dest_dir="$2"

tools/find_and_get_pod5.py "${src_dir}/pod5" "${dest_dir}"


================================================
FILE: benchmarks/find_all_samples/run_blow5.sh
================================================
#!/bin/bash
# Runs tools/pyslow5_tests.py in `all_values` mode, requesting the `samples`
# column, over every *.blow5 file found in <input_dir>/blow5.
#   $1: input directory (must contain a blow5/ subdirectory)
#   $2: output directory

src_dir="$1"
dest_dir="$2"

./tools/pyslow5_tests.py \
    "${src_dir}"/blow5/*.blow5 \
    "${dest_dir}" \
    all_values \
    --get-column samples


================================================
FILE: benchmarks/find_all_samples/run_fast5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_fast5.py on <input_dir>/fast5, requesting the
# `samples` column.
#   $1: input directory (must contain a fast5/ subdirectory)
#   $2: output directory

src_dir="$1"
dest_dir="$2"

./tools/find_and_get_fast5.py \
    "${src_dir}/fast5" \
    "${dest_dir}" \
    --get-column samples


================================================
FILE: benchmarks/find_all_samples/run_pod5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_pod5.py on <input_dir>/pod5, requesting the
# `samples` column.
#   $1: input directory (must contain a pod5/ subdirectory)
#   $2: output directory

src_dir="$1"
dest_dir="$2"

tools/find_and_get_pod5.py \
    "${src_dir}/pod5" \
    "${dest_dir}" \
    --get-column samples


================================================
FILE: benchmarks/find_selected_read_ids_read_number/run_blow5.sh
================================================
#!/bin/bash
# Runs tools/pyslow5_tests.py in `sample_values` mode, requesting the
# `read_number` column for the ids listed in selected_read_ids.csv, over every
# *.blow5 file found in <input_dir>/blow5.
#   $1: input directory (must contain a blow5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

./tools/pyslow5_tests.py \
    "${src_dir}"/blow5/*.blow5 \
    "${dest_dir}" \
    sample_values \
    --get-column read_number \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_read_number/run_fast5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_fast5.py on <input_dir>/fast5, requesting the
# `read_number` column for the ids listed in selected_read_ids.csv.
#   $1: input directory (must contain a fast5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

./tools/find_and_get_fast5.py \
    "${src_dir}/fast5" \
    "${dest_dir}" \
    --get-column read_number \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_read_number/run_pod5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_pod5.py on <input_dir>/pod5, requesting the
# `read_number` column for the ids listed in selected_read_ids.csv.
#   $1: input directory (must contain a pod5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

tools/find_and_get_pod5.py \
    "${src_dir}/pod5" \
    "${dest_dir}" \
    --get-column read_number \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_sample_count/run_blow5.sh
================================================
#!/bin/bash
# Runs tools/pyslow5_tests.py in `sample_values` mode, requesting the
# `sample_count` column for the ids listed in selected_read_ids.csv, over every
# *.blow5 file found in <input_dir>/blow5.
#   $1: input directory (must contain a blow5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

./tools/pyslow5_tests.py \
    "${src_dir}"/blow5/*.blow5 \
    "${dest_dir}" \
    sample_values \
    --get-column sample_count \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_sample_count/run_fast5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_fast5.py on <input_dir>/fast5, requesting the
# `sample_count` column for the ids listed in selected_read_ids.csv.
#   $1: input directory (must contain a fast5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

./tools/find_and_get_fast5.py \
    "${src_dir}/fast5" \
    "${dest_dir}" \
    --get-column sample_count \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_sample_count/run_pod5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_pod5.py on <input_dir>/pod5, requesting the
# `sample_count` column for the ids listed in selected_read_ids.csv.
#   $1: input directory (must contain a pod5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

tools/find_and_get_pod5.py \
    "${src_dir}/pod5" \
    "${dest_dir}" \
    --get-column sample_count \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_samples/run_blow5.sh
================================================
#!/bin/bash
# Runs tools/pyslow5_tests.py in `sample_values` mode, requesting the
# `samples` column for the ids listed in selected_read_ids.csv, over every
# *.blow5 file found in <input_dir>/blow5.
#   $1: input directory (must contain a blow5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

./tools/pyslow5_tests.py \
    "${src_dir}"/blow5/*.blow5 \
    "${dest_dir}" \
    sample_values \
    --get-column samples \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_samples/run_fast5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_fast5.py on <input_dir>/fast5, requesting the
# `samples` column for the ids listed in selected_read_ids.csv.
#   $1: input directory (must contain a fast5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

./tools/find_and_get_fast5.py \
    "${src_dir}/fast5" \
    "${dest_dir}" \
    --get-column samples \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/find_selected_read_ids_samples/run_pod5.sh
================================================
#!/bin/bash
# Runs tools/find_and_get_pod5.py on <input_dir>/pod5, requesting the
# `samples` column for the ids listed in selected_read_ids.csv.
#   $1: input directory (must contain a pod5/ subdirectory)
#   $2: output directory
#   $3: directory holding selected_read_ids.csv

src_dir="$1"
dest_dir="$2"
ids_dir="$3"

tools/find_and_get_pod5.py \
    "${src_dir}/pod5" \
    "${dest_dir}" \
    --get-column samples \
    --select-ids "${ids_dir}/selected_read_ids.csv"


================================================
FILE: benchmarks/image/Dockerfile.base
================================================
# Base image for running the POD5 / BLOW5 / FAST5 benchmarks.
FROM ubuntu:20.04

RUN apt update && apt install -y wget python3 python3-pip git libzstd-dev

# VBZ HDF5 plugin package from the nanoporetech/vbz_compression releases.
RUN wget https://github.com/nanoporetech/vbz_compression/releases/download/v1.0.1/ont-vbz-hdf-plugin_1.0.1-1.focal_amd64.deb && apt install -y ./ont-vbz-hdf-plugin_1.0.1-1.focal_amd64.deb && rm ont-vbz-hdf-plugin_1.0.1-1.focal_amd64.deb

COPY ./requirements-benchmarks.txt /
RUN pip install -r /requirements-benchmarks.txt

# Single source of truth for the slow5tools release: install_slow5.sh reads
# SLOW_5_TOOLS_VERSION from the environment and unpacks/builds the tools into
# /slow5tools-${SLOW_5_TOOLS_VERSION}, so the PATH entry below must use the
# same value (it was previously hard-coded to a different version and pointed
# at a directory that was never created).
ENV SLOW_5_TOOLS_VERSION=v1.3.0

COPY ./install_slow5.sh /
RUN /install_slow5.sh
ENV PATH="/slow5tools-${SLOW_5_TOOLS_VERSION}/:$PATH"

RUN pip install numpy

# Install the pod5 wheel(s) placed next to this Dockerfile in the build context.
COPY ./pod5*.whl /
RUN pip install *.whl && rm *.whl


================================================
FILE: benchmarks/image/install_slow5.sh
================================================
#!/bin/bash
# Downloads and builds slow5tools, then builds and installs pyslow5 (from
# slow5lib) together with the slow5 C API benchmarks.
#
# Optional environment overrides:
#   SLOW_5_TOOLS_VERSION  slow5tools release tag to download (default v1.3.0)
#   SLOW_5_LIB_VERSION    slow5lib branch/tag to clone       (default v1.3.1)

set -e

: "${SLOW_5_TOOLS_VERSION:=v1.3.0}"
: "${SLOW_5_LIB_VERSION:=v1.3.1}"

apt update
apt install -y libzstd-dev libhdf5-dev

wget "https://github.com/hasindu2008/slow5tools/releases/download/${SLOW_5_TOOLS_VERSION}/slow5tools-${SLOW_5_TOOLS_VERSION}-release.tar.gz"
tar xvf "slow5tools-${SLOW_5_TOOLS_VERSION}-release.tar.gz"
rm "slow5tools-${SLOW_5_TOOLS_VERSION}-release.tar.gz"
(
    cd "slow5tools-${SLOW_5_TOOLS_VERSION}"
    ./configure
    make zstd=1 -j "$(nproc)"
)

# pyslow5 must be built with zstd support for fair comparison (otherwise default zlib is slower than zstd)
git clone -b "${SLOW_5_LIB_VERSION}" https://github.com/hasindu2008/slow5lib

(
    cd slow5lib/

    echo "Installing numpy"
    pip install numpy

    # On failure, show the captured build log and abort with a non-zero status.
    # A bare `exit` after a successful `cat` would exit with status 0 and let
    # the script carry on as if the build had succeeded.
    make pyslow5 -j "$(nproc)" 2> build_log.txt || { cat build_log.txt >&2; exit 1; }
    echo "Installing pyslow5"
    PYSLOW5_ZSTD=1 pip install dist/*.tar.gz

    # adding slow5 C API benchmarks
    make zstd=1 -j "$(nproc)" && test/bench/build.sh
)


================================================
FILE: benchmarks/image/requirements-benchmarks.txt
================================================
h5py
numpy
pandas
tabulate


================================================
FILE: benchmarks/run_benchmarks.py
================================================
#!/usr/bin/env python3
"""
Example usage:
```
> taskset -c 0-10 ./benchmarks/run_benchmarks.py ./input_files/ \
    ./benchmark-outputs/ --skip-to-benchmark find_all_samples
```
"""

import argparse
import json
import shutil
import subprocess
import time
from collections import namedtuple
from pathlib import Path

import tabulate

# Record type describing one benchmark; fields are accessed by name.
Benchmark = namedtuple(
    "Benchmark",
    "name file_types checks input_benchmark pre_run post_run_fixup",
)

# Directory that contains this script.
BENCHMARK_ROOT = Path(__file__).resolve().parent

# Identifiers for the file formats being compared.
POD5_FILE_TYPE = "pod5"
BLOW5_FILE_TYPE = "blow5"
FAST5_FILE_TYPE = "fast5"

# Column order used when reporting results.
ALL_FILE_TYPES = [
    POD5_FILE_TYPE,
    BLOW5_FILE_TYPE,
    FAST5_FILE_TYPE,
]


def du(path):
    """Return the disk usage of ``path`` as reported by ``du -sh``.

    The result is the first whitespace-separated field of the command's
    output, decoded as UTF-8 (a human readable size such as '2,1GB').
    """
    raw_output = subprocess.check_output(["du", "-sh", path])
    size_field = raw_output.split()[0]
    return size_field.decode("utf-8")


def generate_report(input_dir, output_dir, timing_results):
    """
    Build the markdown summary for a benchmark run.

    Args:
        input_dir: Location of the input data; only echoed into the report.
        output_dir: Root directory of the benchmark outputs. Converted file
            sizes are measured under ``output_dir / "convert" / <file_type>``.
        timing_results: Mapping of benchmark name -> {file type -> seconds}
            for the benchmarks that were actually executed.

    Returns:
        The report text: a run summary, a file size table and a timings table.
    """
    ran_count = len(timing_results)
    skipped_benchmarks = len(ALL_BENCHMARKS) - ran_count
    skipped = f", skipped {skipped_benchmarks}" if skipped_benchmarks != 0 else ""

    report = f"Ran {ran_count} benchmarks{skipped}\n\n"
    report += f"Input data was {input_dir}\n\n"

    report += "File sizes\n"
    report += "----------\n\n"

    convert_output_dir = output_dir / "convert"
    sizes = []
    for file_type in ALL_FILE_TYPES:
        file_type_dir = convert_output_dir / file_type
        # exists() must be *called*: the bare bound method is always truthy,
        # which made `du` run (and fail) on directories that were never made.
        if file_type_dir.exists():
            sizes.append(du(file_type_dir))
        else:
            sizes.append("Not Run")
    report += (
        tabulate.tabulate([sizes], headers=ALL_FILE_TYPES, tablefmt="github") + "\n\n"
    )

    report += "Timings\n"
    report += "-------\n\n"
    results = []
    for benchmark in ALL_BENCHMARKS:
        # Benchmarks that were skipped have no entry: every cell is "Not Run".
        timings = timing_results.get(benchmark.name, {})
        row = [benchmark.name.replace("_", " ")]
        for file_type in ALL_FILE_TYPES:
            if file_type in timings:
                row.append(f"{timings[file_type]:.1f} secs")
            else:
                row.append("Not Run")
        results.append(row)

    results_headers = [""] + ALL_FILE_TYPES
    report += (
        tabulate.tabulate(results, headers=results_headers, tablefmt="github") + "\n"
    )
    return report


def check_read_ids(benchmark, file_types, output_dir, only_format):
    """
    Verify that the read_ids.csv produced for each file type agrees with the
    one produced for the preceding file type.

    Nothing is checked when the run was restricted to a single format.
    Raises subprocess.CalledProcessError when the consistency tool fails.
    """
    if only_format is not None:
        print("Not checking read ids - only one format executed")
        return

    csv_paths = [output_dir / file_type / "read_ids.csv" for file_type in file_types]

    # Compare every csv with its predecessor in the list.
    for index in range(1, len(csv_paths)):
        command = [
            BENCHMARK_ROOT / "tools" / "check_csvs_consistent.py",
            csv_paths[index],
            csv_paths[index - 1],
        ]
        subprocess.run(command, check=True)


def check_file_sizes(benchmark, file_types, output_dir, only_format):
    """Print `du -sh` for every entry directly inside ``output_dir``."""
    print("File sizes for output dir")
    du_command = ["du", "-sh"]
    du_command.extend(output_dir.glob("*"))
    subprocess.run(du_command, check=True)


def copy_fast5_files(benchmark, input_dir, output_dir):
    """Copy the whole input directory tree to ``output_dir / "fast5"``."""
    destination = output_dir / "fast5"
    shutil.copytree(input_dir, destination)


def randomly_select_read_ids(benchmark, input_dir, output_dir):
    """
    Pre-run step: dump the read ids found in ``input_dir / "pod5"`` into
    ``output_dir`` and then write a random 10% selection of them to
    ``output_dir / "selected_read_ids.csv"``.

    Raises subprocess.CalledProcessError if either helper tool fails.
    """
    print("Randomly selecting read ids for benchmark")

    tools_dir = BENCHMARK_ROOT / "tools"

    list_ids_command = [
        tools_dir / "find_and_get_pod5.py",
        input_dir / "pod5",
        output_dir,
    ]
    subprocess.run(list_ids_command, check=True)

    sample_ids_command = [
        tools_dir / "select-random-ids.py",
        output_dir / "read_ids.csv",
        output_dir / "selected_read_ids.csv",
        "--select-ratio",
        "0.1",
    ]
    subprocess.run(sample_ids_command, check=True)


# Benchmarks in execution order. "convert" runs first on the raw input and only
# for pod5/blow5; its post-run fixup copies the input files into a "fast5"
# directory. Every later benchmark uses the "convert" output directory as its
# input. The find_selected_* benchmarks first pick a random set of read ids.
ALL_BENCHMARKS = [
    Benchmark(
        "convert",
        [POD5_FILE_TYPE, BLOW5_FILE_TYPE],
        [check_file_sizes],
        input_benchmark=None,
        post_run_fixup=copy_fast5_files,
        pre_run=None,
    ),
    Benchmark(
        "find_all_read_ids",
        ALL_FILE_TYPES,
        [check_read_ids],
        input_benchmark="convert",
        post_run_fixup=None,
        pre_run=None,
    ),
    Benchmark(
        "find_all_samples",
        ALL_FILE_TYPES,
        [check_read_ids],
        input_benchmark="convert",
        post_run_fixup=None,
        pre_run=None,
    ),
    Benchmark(
        "find_selected_read_ids_read_number",
        ALL_FILE_TYPES,
        [check_read_ids],
        input_benchmark="convert",
        post_run_fixup=None,
        pre_run=randomly_select_read_ids,
    ),
    Benchmark(
        "find_selected_read_ids_sample_count",
        ALL_FILE_TYPES,
        [check_read_ids],
        input_benchmark="convert",
        post_run_fixup=None,
        pre_run=randomly_select_read_ids,
    ),
    Benchmark(
        "find_selected_read_ids_samples",
        ALL_FILE_TYPES,
        [check_read_ids],
        input_benchmark="convert",
        post_run_fixup=None,
        pre_run=randomly_select_read_ids,
    ),
]


def run_benchmark(benchmark, input_dir, output_dir, only_format=None):
    """
    Execute one benchmark for each of its file types and time every run.

    Any previous ``output_dir`` is removed first. The optional pre-run hook is
    called before the per-format scripts, the optional post-run fixup and the
    checks afterwards. When ``only_format`` is given, all other formats are
    skipped.

    Returns:
        Dict mapping each executed file type to its wall-clock duration in
        seconds.
    """
    if output_dir.exists():
        print("Removing old output dir")
        shutil.rmtree(output_dir)

    file_types = benchmark.file_types or ALL_FILE_TYPES
    time_results = {}

    if benchmark.pre_run:
        benchmark.pre_run(benchmark, input_dir, output_dir)

    for file_type in file_types:
        selected = only_format is None or only_format == file_type
        if not selected:
            print(f"## Skipping for file type {file_type}:")
            continue

        print(f"## Running for file type {file_type}:")
        file_type_output_dir = output_dir / file_type
        file_type_output_dir.mkdir(exist_ok=True, parents=True)

        command = [
            BENCHMARK_ROOT / benchmark.name / f"run_{file_type}.sh",
            input_dir,
            file_type_output_dir,
            output_dir,
        ]
        start = time.time()
        subprocess.run(command, check=True, cwd=BENCHMARK_ROOT)
        duration_secs = time.time() - start

        time_results[file_type] = duration_secs
        print(f"## Took {duration_secs:.2f} seconds")

    if benchmark.post_run_fixup:
        benchmark.post_run_fixup(benchmark, input_dir, output_dir)

    if benchmark.checks:
        print("## Running checks")
        for check in benchmark.checks:
            check(benchmark, file_types, output_dir, only_format)

    return time_results


def run_benchmarks(args):
    """
    Run every benchmark (optionally starting from a named one), print the
    report and write ``timings.json`` and ``report.md`` to the output dir.

    Args:
        args: Parsed command line namespace providing ``input_dir``,
            ``output_dir``, ``skip_to_benchmark`` and ``only_format``.

    Raises:
        ValueError: If ``args.skip_to_benchmark`` does not name a benchmark.
            Previously such a value silently skipped every benchmark.
    """
    timing_results = {}

    input_dir = args.input_dir.resolve()
    output_dir = args.output_dir.resolve()

    benchmark_names = [benchmark.name for benchmark in ALL_BENCHMARKS]
    skipped_names = set()
    if args.skip_to_benchmark:
        if args.skip_to_benchmark not in benchmark_names:
            raise ValueError(
                f"Unknown benchmark '{args.skip_to_benchmark}', "
                f"expected one of: {', '.join(benchmark_names)}"
            )
        # Everything listed before the requested benchmark is skipped.
        first_to_run = benchmark_names.index(args.skip_to_benchmark)
        skipped_names = set(benchmark_names[:first_to_run])

    for benchmark in ALL_BENCHMARKS:
        if benchmark.name in skipped_names:
            print(f"# Skipping benchmark {benchmark.name}")
            continue
        print(f"# Running benchmark {benchmark.name}:")
        benchmark_input_dir = input_dir
        if benchmark.input_benchmark:
            # Chained benchmarks read the output of an earlier benchmark.
            benchmark_input_dir = output_dir / benchmark.input_benchmark
        timing_results[benchmark.name] = run_benchmark(
            benchmark,
            benchmark_input_dir,
            output_dir / benchmark.name,
            args.only_format,
        )

    report = generate_report(input_dir, output_dir, timing_results)
    print(report)

    # Make sure the report destination exists even if nothing created it.
    output_dir.mkdir(parents=True, exist_ok=True)
    with open(output_dir / "timings.json", "w") as f:
        f.write(json.dumps(timing_results, indent=2))
    with open(output_dir / "report.md", "w") as f:
        f.write(report)


def main():
    """Parse the command line and run the benchmarks."""
    parser = argparse.ArgumentParser("Run Benchmarks for POD5 format")

    for positional in ("input_dir", "output_dir"):
        parser.add_argument(positional, type=Path)

    string_options = (
        ("--skip-to-benchmark", "Start benchmarking from a named benchmark"),
        ("--only-format", "Only run benchmarks for a single format"),
    )
    for flag, help_text in string_options:
        parser.add_argument(flag, type=str, help=help_text)

    run_benchmarks(parser.parse_args())


if __name__ == "__main__":
    main()


================================================
FILE: benchmarks/run_benchmarks_in_docker.sh
================================================
#!/bin/bash
#
# Run the benchmark suite inside the pod5-benchmark-base docker image.
#
# Usage: run_benchmarks_in_docker.sh <input_dir>
#
# The input directory is mounted at /input, results are written to
# ./pod5-benchmark-outputs (mounted at /outputs), and this script's directory
# is mounted at /benchmarks.

set -e

# Fail early with a usage message instead of an opaque readlink error.
if [ "$#" -lt 1 ] || [ ! -d "$1" ]; then
    echo "Usage: $0 <input_dir>" >&2
    exit 1
fi

input_dir=$(readlink -f "$1")
output_dir="$(pwd)/pod5-benchmark-outputs"
mkdir -p "${output_dir}"

script_dir=$( cd -- "$( dirname -- "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )

echo "Running benchmark on input '${input_dir}'"

docker run --rm -it -v"${input_dir}":/input -v"${output_dir}":/outputs -v"${script_dir}"/:/benchmarks pod5-benchmark-base /benchmarks/tools/run_benchmarks_docker_entry.sh


================================================
FILE: benchmarks/tools/check_csvs_consistent.py
================================================
#!/usr/bin/env python3

import argparse
import sys

import pandas as pd
from pandas.testing import assert_frame_equal


def check_consistency(df1, df2):
    """
    Assert that two data frames are equal once both are ordered by read_id.

    Raises AssertionError on any difference; otherwise reports success and
    exits the process with status 0.
    """
    ordered_frames = [
        frame.sort_values("read_id", ignore_index=True) for frame in (df1, df2)
    ]
    assert_frame_equal(*ordered_frames)

    print("Data frames are consistent")
    sys.exit(0)


def main():
    """Load the two CSV files named on the command line and compare them."""
    parser = argparse.ArgumentParser()
    for argument_name in ("input_a", "input_b"):
        parser.add_argument(argument_name)
    args = parser.parse_args()

    frame_a = pd.read_csv(args.input_a)
    frame_b = pd.read_csv(args.input_b)

    print(f"Check consistency of files {args.input_a} and {args.input_b}")
    check_consistency(frame_a, frame_b)


if __name__ == "__main__":
    main()


================================================
FILE: benchmarks/tools/fast5_to_single_blow5.sh
================================================
#!/bin/bash
#
# Convert a directory of fast5 files into a single indexed blow5 file.
#
# Usage: fast5_to_single_blow5.sh <input_path> <output_path>

input_path=$1
output_path=$2

mkdir -p "$output_path"

temp_dir="${output_path}/tmp"
mkdir -p "$temp_dir"

# specific options (-c zstd -s svb-zd) must be provided to slow5tools to create compression comparable to vbz
# also number of processes/threads must be set to 10 to match with default value in pod5_convert
# however, the svb-zd stream variable byte + zig-zag delta implementation in slow5 mirrors
# ONT's previous 32 bit zigzag delta, whereas pod5 is using a newer 16 bit zigzag delta with SIMD optimisations
# so pod5 has the added performance benefit of using the newer zigzag delta
# slow5 compression methods are modular, so we can easily add the new one if necessary
slow5tools f2s "$input_path" -d "$temp_dir" -p 10 -c zstd -s svb-zd

# Most comparable to have one file for both formats.
# If the files are from the same run ID, slow5tools cat can be used, which is
# significantly faster; otherwise fall back to slow5tools merge.
# Each argument must be quoted separately: quoting the whole argument list as
# one string passed a single bogus path, so cat always failed and the slower
# merge was always used.
slow5tools cat "$temp_dir" -o "$output_path/file.blow5" || slow5tools merge "$temp_dir" -o "$output_path/file.blow5" -t 10 -c zstd -s svb-zd

rm -r "$temp_dir"

# Index will get generated on first test anyway, we should do it now to give best results later:
# current slow5tools implementation decompresses the whole record for indexing and is not efficient
# the specification supports partial decompress of the record (also signal chunking if necessary)
slow5tools index "$output_path/file.blow5"


================================================
FILE: benchmarks/tools/find_and_get_fast5.py
================================================
#!/usr/bin/env python3

import argparse
from pathlib import Path

import h5py
import numpy
import pandas as pd


def select_reads(file, selection):
    """
    Yield ``(read_id, path)`` pairs for reads present in ``file``.

    With a ``selection``, only the listed read ids that exist in the file are
    yielded (as ``/read_<id>`` paths). Without one, every top-level key that
    starts with ``read_`` is yielded, with the prefix stripped from the id.
    """
    if selection is None:
        prefix = "read_"
        for key in file.keys():
            if key.startswith(prefix):
                yield key[len(prefix) :], key
        return

    for read in selection:
        path = f"/read_{read}"
        if path in file:
            yield read, path


def run(input_dir, output, select_read_ids=None, get_columns=None):
    """
    Collect read ids (and optional per-read columns) from all ``*.fast5`` files
    in ``input_dir`` and write them to ``output / "read_ids.csv"``.

    Args:
        input_dir: Directory (Path) searched, non-recursively, for fast5 files.
        output: Directory (Path) the CSV is written to; created if missing.
        select_read_ids: Optional iterable of read ids to restrict the search
            to. When None, every read in every file is used.
        get_columns: Optional list of extra columns to extract. Recognised
            names are "read_number", "sample_count" and "samples" (the sum of
            the raw signal). None is treated as an empty list.
    """
    output.mkdir(parents=True, exist_ok=True)

    # Avoid a mutable default argument; None means "no extra columns".
    columns = [] if get_columns is None else get_columns

    if select_read_ids is not None:
        print(f"Selecting {len(select_read_ids)} specific read ids")
    print(f"Selecting columns: {columns}")

    read_ids = []
    extracted_columns = {"read_id": read_ids}
    print(f"Search for input files in {input_dir}")
    for fast5_path in input_dir.glob("*.fast5"):
        print(f"Searching for reads in {fast5_path}")

        # Open with a context manager so each HDF5 handle is closed before
        # moving on to the next file (they were previously never closed).
        with h5py.File(fast5_path, "r") as fast5_file:
            for read_id, read_path in select_reads(fast5_file, select_read_ids):
                read_ids.append(read_id)

                for c in columns:
                    # Column lists are created lazily on the first read found.
                    col = extracted_columns.setdefault(c, [])
                    raw_group = f"{read_path}/Raw"

                    if c == "read_number":
                        col.append(fast5_file[raw_group].attrs["read_number"])
                    elif c == "sample_count":
                        col.append(len(fast5_file[raw_group]["Signal"]))
                    elif c == "samples":
                        col.append(numpy.sum(fast5_file[raw_group]["Signal"]))

    df = pd.DataFrame(extracted_columns)
    print(f"Selected {len(read_ids)} items")
    df.to_csv(output / "read_ids.csv", index=False)


def main():
    """Command line entry point: parse options and extract reads from fast5."""
    parser = argparse.ArgumentParser()
    for positional in ("input", "output"):
        parser.add_argument(positional, type=Path)
    parser.add_argument(
        "--select-ids",
        type=str,
        help="CSV file with a read_id column, listing ids to find in input files",
    )
    parser.add_argument(
        "--get-column",
        default=[],
        nargs="+",
        type=str,
        help="Add columns that should be extracted",
    )
    args = parser.parse_args()

    # Only load a selection when a CSV file was supplied.
    select_read_ids = (
        pd.read_csv(args.select_ids)["read_id"] if args.select_ids else None
    )

    run(
        args.input,
        args.output,
        select_read_ids=select_read_ids,
        get_columns=args.get_column,
    )


if __name__ == "__main__":
    main()


================================================
FILE: benchmarks/tools/find_and_get_pod5.py
================================================
#!/usr/bin/env python3

import argparse
import multiprocessing as mp
import tempfile
from collections import namedtuple
from pathlib import Path
from queue import Empty

import numpy
import pandas as pd

import pod5 as p5

# Describes one worker's share of the memory-mapped read id array:
#   path        - file backing the numpy memmap
#   slice_start - first index (inclusive) of the worker's slice
#   slice_end   - end index (exclusive) of the worker's slice
#   shape       - shape of the complete mapped array
SelectReadIdsData = namedtuple(
    "SelectReadIdsData", ["path", "slice_start", "slice_end", "shape"]
)


def load_mapped_ids(select_read_ids_data):
    """Map the on-disk read id array and return the slice it describes."""
    first = select_read_ids_data.slice_start
    last = select_read_ids_data.slice_end

    all_mapped_ids = numpy.memmap(
        select_read_ids_data.path,
        dtype=numpy.uint8,
        mode="r+",
        shape=select_read_ids_data.shape,
    )
    return all_mapped_ids[first:last]


def do_batch_work(filename, batches, column, mode, result_q):
    """
    Worker body: read the given batches of one file and push a DataFrame of
    read ids and per-read values onto ``result_q``.

    Only the "samples" column is supported (the sum of each read's signal);
    any other column is reported and yields an empty frame.
    """
    read_ids = []
    vals = []

    if column != "samples":
        print(f"Unknown column {column}")
    else:
        reader = p5.Reader(filename)
        selected_batches = reader.read_batches(
            batch_selection=batches, preload={"samples"}
        )
        for batch in selected_batches:
            read_ids.extend(p5.format_read_ids(batch.read_id_column))
            vals.extend(numpy.sum(read.signal) for read in batch.reads())

    result_q.put(pd.DataFrame({"read_id": read_ids, column: vals}))


def do_search_work(files, select_read_ids_data, column, mode, result_q):
    """
    Worker body: look up this worker's slice of the selected read ids in every
    file and push a DataFrame of read ids and per-read values onto
    ``result_q``.

    Only the "samples" column is supported (the sum of each read's signal);
    any other column is reported and yields an empty frame.
    """
    select_read_ids = load_mapped_ids(select_read_ids_data)

    read_ids = []
    vals = []

    if column != "samples":
        print(f"Unknown column {column}")
    else:
        for filename in files:
            reader = p5.Reader(filename)
            for batch in reader.read_batches(select_read_ids, preload={"samples"}):
                read_ids.extend(p5.format_read_ids(batch.read_id_column))
                vals.extend([numpy.sum(s) for s in batch.cached_samples_column])

    result_q.put(pd.DataFrame({"read_id": read_ids, column: vals}))


def run_multiprocess(files, output, select_read_ids=None, column=None, mode=None):
    """
    Do work across a number of python multiprocesses

    Args:
        files: Paths of the pod5 files to read.
        output: Unused here; kept for interface compatibility.
        select_read_ids: Optional collection of read ids to restrict the work
            to. When given, the ids are split into chunks and each worker
            searches every file for its chunk. When None, the batches of each
            file are split between workers instead.
        column: Column to extract; forwarded to the workers.
        mode: Forwarded to the workers.

    Returns:
        The concatenation of the DataFrames produced by all workers.
    """
    mp.set_start_method("spawn")

    select_read_ids_mmap_path = None
    try:
        if select_read_ids is not None:
            print("Placing select read id data on disk for mmapping:")
            numpy_select_read_ids = p5.pack_read_ids(select_read_ids)

            # Copy data to memory-map. The temporary file is only used to
            # obtain a unique name: it is removed on close() and then
            # re-created by numpy.memmap in "w+" mode.
            fp = tempfile.NamedTemporaryFile()
            fp.close()
            mapped_select_read_ids = numpy.memmap(
                fp.name, dtype=numpy.uint8, mode="w+", shape=numpy_select_read_ids.shape
            )
            select_read_ids_mmap_path = Path(fp.name)
            numpy.copyto(mapped_select_read_ids, numpy_select_read_ids)

        result_queue = mp.Queue()
        runners = 10

        processes = []
        if select_read_ids is not None:
            # One worker per chunk of read ids; each worker scans all files.
            approx_chunk_size = max(1, len(select_read_ids) // runners)
            start_index = 0
            while start_index < len(select_read_ids):
                select_read_ids_data = SelectReadIdsData(
                    select_read_ids_mmap_path,
                    start_index,
                    start_index + approx_chunk_size,
                    numpy_select_read_ids.shape,
                )

                p = mp.Process(
                    target=do_search_work,
                    args=(files, select_read_ids_data, column, mode, result_queue),
                )
                p.start()
                processes.append(p)
                start_index += approx_chunk_size
        else:
            # One worker per chunk of batches, for every file.
            for filename in files:
                file = p5.Reader(filename)
                batches = list(range(file.batch_count))
                approx_chunk_size = max(1, len(batches) // runners)
                start_index = 0
                while start_index < len(batches):
                    select_batches = batches[
                        start_index : start_index + approx_chunk_size
                    ]
                    p = mp.Process(
                        target=do_batch_work,
                        args=(filename, select_batches, column, mode, result_queue),
                    )
                    p.start()
                    processes.append(p)
                    start_index += len(select_batches)

        print("Wait for processes...")

        # Drain one result per worker before joining, so that no worker is
        # left blocked on a full queue.
        items = []
        while len(items) < len(processes):
            try:
                item = result_queue.get(timeout=0.5)
                items.append(item)
            except Empty:
                continue

        for p in processes:
            p.join()

        return pd.concat(items)
    finally:
        # Remove the mmap backing file. This used to sit after the return
        # statement and was therefore never executed.
        if select_read_ids_mmap_path is not None:
            select_read_ids_mmap_path.unlink()


def run_get_read_ids(files):
    """
    Collect the formatted read ids of every batch in every file and return
    them as a single-column ("read_id") DataFrame.
    """
    collected_ids = []
    for filename in files:
        reader = p5.Reader(filename)
        for batch in reader.read_batches():
            formatted = p5.format_read_ids(batch.read_id_column)
            collected_ids.extend(formatted)
    return pd.DataFrame({"read_id": collected_ids})


def run_select(files, select_read_ids, column):
    """
    Read ``column`` for the selected read ids from every file.

    "sample_count" is served from the batch's preloaded sample count data; any
    other column is read from the batch attribute named ``<column>_column``.
    Returns a DataFrame with "read_id" and ``column`` columns.
    """
    read_ids = []
    vals = []

    wants_sample_count = column == "sample_count"
    col_name = f"{column}_column"

    for filename in files:
        reader = p5.Reader(filename)
        if wants_sample_count:
            for batch in reader.read_batches(select_read_ids, preload={"sample_count"}):
                read_ids.extend(p5.format_read_ids(batch.read_id_column))
                vals.extend(batch.cached_sample_count_column)
        else:
            for batch in reader.read_batches(select_read_ids):
                read_ids.extend(p5.format_read_ids(batch.read_id_column))
                vals.extend(getattr(batch, col_name))

    return pd.DataFrame({"read_id": read_ids, column: vals})


def run_batched(files, column):
    """
    Read ``column`` for all reads of every file.

    "sample_count" is served from the batch's preloaded sample count data; any
    other column is read from the batch attribute named ``<column>_column``
    and converted with ``to_numpy()``.
    Returns a DataFrame with "read_id" and ``column`` columns.
    """
    read_ids = []
    vals = []

    wants_sample_count = column == "sample_count"
    col_name = f"{column}_column"

    for filename in files:
        reader = p5.Reader(filename)
        if wants_sample_count:
            for batch in reader.read_batches(preload={"sample_count"}):
                read_ids.extend(p5.format_read_ids(batch.read_id_column))
                vals.extend(batch.cached_sample_count_column)
        else:
            for batch in reader.read_batches():
                read_ids.extend(p5.format_read_ids(batch.read_id_column))
                vals.extend(getattr(batch, col_name).to_numpy())

    return pd.DataFrame({"read_id": read_ids, column: vals})


def main():
    """
    Command line entry point: pick the extraction strategy matching the
    options and write the result to ``<output>/read_ids.csv``.
    """
    parser = argparse.ArgumentParser()
    for positional in ("input", "output"):
        parser.add_argument(positional, type=Path)
    parser.add_argument(
        "--select-ids",
        type=str,
        help="CSV file with a read_id column, listing ids to find in input files",
    )
    parser.add_argument(
        "--get-column",
        default=None,
        type=str,
        help="Add column that should be extracted",
    )
    args = parser.parse_args()

    requested_column = args.get_column

    select_read_ids = (
        pd.read_csv(args.select_ids)["read_id"] if args.select_ids else None
    )

    if select_read_ids is not None:
        print(f"Selecting {len(select_read_ids)} specific read ids")
    if requested_column is not None:
        print(f"Selecting column: {requested_column}")

    mode = None

    print(f"Search for input files in {args.input}")
    files = list(args.input.glob("*.pod5"))
    print(f"Searching in {[str(f) for f in files]}")

    # Run benchmark using most appropriate method:
    if requested_column is None:
        # No column requested: only the read ids are listed.
        df = run_get_read_ids(files)
    elif requested_column == "samples":
        # The "samples" column is the sum of all samples of a read, so it is
        # quicker to split the summing work over python multiprocessing.
        df = run_multiprocess(
            files,
            args.output,
            select_read_ids=select_read_ids,
            column=requested_column,
            mode=mode,
        )
    elif args.select_ids:
        df = run_select(files, select_read_ids=select_read_ids, column=requested_column)
    else:
        df = run_batched(files, column=requested_column)

    print(f"Selected {len(df)} items")
    args.output.mkdir(parents=True, exist_ok=True)
    df.to_csv(args.output / "read_ids.csv", index=False)


if __name__ == "__main__":
    main()


================================================
FILE: benchmarks/tools/pyslow5_tests.py
================================================
#!/usr/bin/env python3

import argparse
import multiprocessing as mp
from pathlib import Path
from queue import Empty

import numpy
import pandas as pd
import pyslow5


def random_access(s5_file, read_list, col, result_q):
    """
    Worker body: fetch the reads in ``read_list`` from a slow5 file and push a
    DataFrame holding the read ids and the requested column onto ``result_q``.

    "samples" is the sum of the read's signal, "sample_count" its
    ``len_raw_signal``; any other name is requested as an auxiliary field.
    """
    file = pyslow5.Open(str(s5_file), "r")
    print("processing ", s5_file)

    read_ids = []
    vals = []
    extracted_columns = {"read_id": read_ids, col: vals}

    fetch_options = {"threads": 10, "batchsize": 5000}
    if col == "samples":

        def extract(read):
            return numpy.sum(read["signal"])

    elif col == "sample_count":

        def extract(read):
            return read["len_raw_signal"]

    else:
        fetch_options.update(pA=False, aux=col)

        def extract(read):
            return read[col]

    for read in file.get_read_list_multi(read_list, **fetch_options):
        read_ids.append(read["read_id"])
        vals.append(extract(read))

    result_q.put(pd.DataFrame(extracted_columns))


def run(s5_file, benchmark, select_read_ids, col):
    """
    Run one of the slow5 benchmarks and return its result as a DataFrame.

    * "get_all_read_ids": list every read id in the file.
    * "sample_values": split ``select_read_ids`` into chunks and fetch ``col``
      for them with one worker process per chunk.
    * "all_values": read ``col`` sequentially for every read in the file.
    """
    if benchmark == "get_all_read_ids":
        file = pyslow5.Open(str(s5_file), "r")
        print("processing ", s5_file)
        read_ids, num_reads = file.get_read_ids()
        extracted_columns = {"read_id": read_ids}

    elif benchmark == "sample_values":
        mp.set_start_method("spawn")
        result_queue = mp.Queue()
        runners = 10
        total_ids = len(select_read_ids)
        approx_chunk_size = max(1, total_ids // runners)

        processes = []
        for chunk_start in range(0, total_ids, approx_chunk_size):
            chunk_end = min(total_ids, chunk_start + approx_chunk_size)
            chunk_ids = [select_read_ids[j] for j in range(chunk_start, chunk_end)]
            worker = mp.Process(
                target=random_access, args=(s5_file, chunk_ids, col, result_queue)
            )
            worker.start()
            processes.append(worker)

        print("Wait for processes...")
        # Collect one result per worker before joining them.
        items = []
        while len(items) < len(processes):
            try:
                items.append(result_queue.get(timeout=0.5))
            except Empty:
                continue

        for worker in processes:
            worker.join()

        return pd.concat(items)

    elif benchmark == "all_values":
        file = pyslow5.Open(str(s5_file), "r")
        print("processing ", s5_file)

        read_ids = []
        vals = []
        extracted_columns = {"read_id": read_ids, col: vals}

        read_options = {"threads": 10, "batchsize": 5000}
        if col == "samples":

            def extract(read):
                return numpy.sum(read["signal"])

        elif col == "sample_count":

            def extract(read):
                return read["len_raw_signal"]

        else:
            read_options.update(pA=False, aux=col)

            def extract(read):
                return read[col]

        for read in file.seq_reads_multi(**read_options):
            read_ids.append(read["read_id"])
            vals.append(extract(read))

    return pd.DataFrame(extracted_columns)


def main():
    """
    Command line entry point: run the requested slow5 benchmark and write the
    result to ``<output>/read_ids.csv``.
    """
    parser = argparse.ArgumentParser()
    for positional in ("input", "output"):
        parser.add_argument(positional, type=Path)
    parser.add_argument(
        "benchmark",
        type=str,
        choices=["get_all_read_ids", "sample_values", "all_values"],
        help="which benchmark to run",
    )
    parser.add_argument(
        "--select-ids",
        type=str,
        help="CSV file with a read_id column, listing ids to find in input files",
    )
    parser.add_argument(
        "--get-column",
        default=None,
        type=str,
        help="Add columns that should be extracted",
    )
    args = parser.parse_args()

    args.output.mkdir(parents=True, exist_ok=True)

    # The selection is handed on as a plain list (empty when no CSV is given).
    select_reads = []
    if args.select_ids:
        select_reads.extend(pd.read_csv(args.select_ids)["read_id"])

    print(f"Num of select_reads: {len(select_reads)}")

    df = run(
        args.input,
        args.benchmark,
        select_read_ids=select_reads,
        col=args.get_column,
    )
    print(f"Selected {len(df)} items")
    df.to_csv(args.output / "read_ids.csv", index=False)


if __name__ == "__main__":
    main()


================================================
FILE: benchmarks/tools/run_benchmarks_docker_entry.sh
================================================
#!/bin/bash

# Container entry point: benchmarks read from /input and write to /outputs.
# Use taskset to limit benchmarks to specific cores, ensuring a fair test of limited resources:
# (the CPU list 0-10 is inclusive, i.e. CPUs 0 through 10)
taskset -c 0-10 /benchmarks/run_benchmarks.py /input /outputs


================================================
FILE: benchmarks/tools/select-random-ids.py
================================================
#!/usr/bin/env python3

import argparse
from pathlib import Path

import pandas as pd


def main():
    """Write a random subset of the rows of a CSV file to a new CSV file.

    Positional arguments are the input CSV and the output CSV; the output's
    parent directory is created if needed. ``--select-ratio`` is passed to
    ``DataFrame.sample`` as ``frac`` (``None`` when the option is omitted, in
    which case pandas applies its own default). The sampled frame is written
    with its index column.
    """
    cli = argparse.ArgumentParser()
    cli.add_argument("input_csv", type=Path)
    cli.add_argument("output_csv", type=Path)
    cli.add_argument("--select-ratio", type=float)
    opts = cli.parse_args()

    # Read and sample before touching the output location, as a failed read
    # should not leave an empty directory behind.
    sampled = pd.read_csv(opts.input_csv).sample(frac=opts.select_ratio)

    destination = opts.output_csv
    destination.parent.mkdir(parents=True, exist_ok=True)
    sampled.to_csv(destination)


# Run the command-line interface only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()


================================================
FILE: c++/CMakeLists.txt
================================================


# Locate the third-party dependencies of pod5_format.
# With ENABLE_CONAN every package is requested in CONFIG mode; otherwise the
# default find_package() search is used.
if (ENABLE_CONAN)
    find_package(Arrow REQUIRED CONFIG)
    find_package(Flatbuffers REQUIRED CONFIG)
    find_package(zstd REQUIRED CONFIG)
    find_package(ZLIB REQUIRED CONFIG)

    # Pass the variable *name* to if(): an unquoted ${CMAKE_SYSTEM_NAME} is expanded
    # first and the resulting word may itself be re-evaluated as a variable name
    # (and an empty expansion would be a syntax error).
    if (CMAKE_SYSTEM_NAME STREQUAL "Linux")
        find_package(jemalloc REQUIRED CONFIG)
    endif()
else()
    find_package(Arrow REQUIRED)
    find_package(Flatbuffers REQUIRED)
    find_package(zstd REQUIRED)
    find_package(ZLIB REQUIRED)

    # Our non-conan ubuntu CI build has a different name for this target:
    # provide arrow::arrow as an interface target forwarding to Arrow::arrow_shared.
    if (NOT CONAN2)
        add_library(arrow::arrow INTERFACE IMPORTED)
        target_link_libraries(arrow::arrow INTERFACE Arrow::arrow_shared)
    endif()
endif()

# Threads::Threads is linked into pod5_format further down.
find_package(Threads REQUIRED)

# Look up the flatc schema compiler; the path is stored in FLATBUFFERS_FLATC_EXECUTABLE.
find_program(
    FLATBUFFERS_FLATC_EXECUTABLE
    flatc
)
# NOTE(review): presumably provides flatbuffers_generate_headers(), which is called
# later in this file - confirm against the module.
include(BuildFlatBuffers)

# Generate pod5_format/version.h in the build tree from the version.h.in template.
configure_file(
    pod5_format/version.h.in
    pod5_format/version.h
)

# Build a static library unless BUILD_SHARED_LIB is set.
set(pod5_library_type STATIC)
if (BUILD_SHARED_LIB)
    set(pod5_library_type SHARED)
endif()

# The pod5_format library itself. Headers are listed next to their sources so that
# IDE generators show them; each file must appear only once.
add_library(pod5_format ${pod5_library_type}
    pod5_format/file_recovery.h
    pod5_format/file_writer.cpp
    pod5_format/file_writer.h
    pod5_format/file_reader.cpp
    pod5_format/file_reader.h
    pod5_format/file_updater.cpp
    pod5_format/file_updater.h

    pod5_format/async_signal_loader.cpp
    pod5_format/async_signal_loader.h

    # schema_metadata.h pairs with schema_metadata.cpp; table_reader.h is listed
    # once, together with table_reader.cpp, further down.
    pod5_format/schema_metadata.cpp
    pod5_format/schema_metadata.h
    pod5_format/schema_field_builder.h

    pod5_format/read_table_reader.cpp
    pod5_format/read_table_reader.h
    pod5_format/read_table_schema.cpp
    pod5_format/read_table_schema.h
    pod5_format/read_table_writer.cpp
    pod5_format/read_table_writer.h
    pod5_format/read_table_writer_utils.cpp
    pod5_format/read_table_writer_utils.h
    pod5_format/read_table_utils.cpp
    pod5_format/read_table_utils.h

    pod5_format/run_info_table_reader.cpp
    pod5_format/run_info_table_reader.h
    pod5_format/run_info_table_schema.cpp
    pod5_format/run_info_table_schema.h
    pod5_format/run_info_table_writer.cpp
    pod5_format/run_info_table_writer.h

    pod5_format/signal_compression.cpp
    pod5_format/signal_compression.h
    pod5_format/signal_table_reader.cpp
    pod5_format/signal_table_reader.h
    pod5_format/signal_table_schema.cpp
    pod5_format/signal_table_schema.h
    pod5_format/signal_table_writer.cpp
    pod5_format/signal_table_writer.h
    pod5_format/signal_table_utils.h
    pod5_format/signal_builder.h

    pod5_format/c_api.cpp
    pod5_format/c_api.h

    pod5_format/expandable_buffer.h
    pod5_format/io_manager.cpp
    pod5_format/io_manager.h
    pod5_format/memory_pool.cpp
    pod5_format/memory_pool.h
    pod5_format/result.h
    pod5_format/schema_utils.cpp
    pod5_format/schema_utils.h
    pod5_format/table_reader.cpp
    pod5_format/table_reader.h
    pod5_format/thread_pool.cpp
    pod5_format/thread_pool.h
    pod5_format/tuple_utils.h
    pod5_format/types.cpp
    pod5_format/types.h
    pod5_format/uuid.h

    pod5_format/migration/migration.cpp
    pod5_format/migration/migration.h
    pod5_format/migration/migration_utils.h
    pod5_format/migration/v0_to_v1.cpp
    pod5_format/migration/v1_to_v2.cpp
    pod5_format/migration/v2_to_v3.cpp
    pod5_format/migration/v3_to_v4.cpp

    pod5_format/internal/async_output_stream.h
    pod5_format/internal/combined_file_utils.h
    pod5_format/internal/linux_output_stream.h

    pod5_format/svb16/common.hpp
    pod5_format/svb16/decode.hpp
    pod5_format/svb16/decode_scalar.hpp
    pod5_format/svb16/decode_x64.hpp
    pod5_format/svb16/encode.hpp
    pod5_format/svb16/encode_scalar.hpp
    pod5_format/svb16/encode_x64.hpp
    pod5_format/svb16/intrinsics.hpp
    pod5_format/svb16/shuffle_tables.hpp
    pod5_format/svb16/simd_detect_x64.hpp
)

# Headers attached to the pod5_format target through its PUBLIC_HEADER property and
# installed by install(TARGETS pod5_format PUBLIC_HEADER ...) below.
set(public_headers)
list(APPEND public_headers
    pod5_format/file_writer.h
    pod5_format/file_reader.h

    pod5_format/schema_metadata.h

    pod5_format/read_table_reader.h
    pod5_format/read_table_schema.h
    pod5_format/read_table_writer.h
    pod5_format/read_table_writer_utils.h
    pod5_format/read_table_utils.h

    pod5_format/run_info_table_writer.h
    pod5_format/run_info_table_reader.h
    pod5_format/run_info_table_schema.h

    pod5_format/signal_compression.h
    pod5_format/signal_table_reader.h
    pod5_format/signal_table_schema.h
    pod5_format/signal_table_writer.h
    pod5_format/signal_table_utils.h
    pod5_format/signal_builder.h
    pod5_format/uuid.h

    pod5_format/c_api.h

    pod5_format/expandable_buffer.h
    pod5_format/file_output_stream.h
    pod5_format/io_manager.h
    pod5_format/memory_pool.h
    pod5_format/result.h
    pod5_format/dictionary_writer.h
    pod5_format/schema_field_builder.h
    pod5_format/schema_utils.h
    pod5_format/table_reader.h
    pod5_format/thread_pool.h
    pod5_format/tuple_utils.h
    pod5_format/types.h


    # Written into the build tree by generate_export_header() further down.
    ${CMAKE_CURRENT_BINARY_DIR}/pod5_format/pod5_format_export.h
)

# svb16 headers are installed separately (install(FILES ...) below) so that they
# end up in their own include/pod5_format/svb16 directory.
set(svb16_headers
    pod5_format/svb16/svb16.h
    pod5_format/svb16/common.hpp
    pod5_format/svb16/decode.hpp
    pod5_format/svb16/decode_scalar.hpp
    pod5_format/svb16/decode_x64.hpp
    pod5_format/svb16/encode.hpp
    pod5_format/svb16/encode_scalar.hpp
    pod5_format/svb16/encode_x64.hpp
    pod5_format/svb16/intrinsics.hpp
    pod5_format/svb16/shuffle_tables.hpp
    pod5_format/svb16/simd_detect_x64.hpp
)

# Target-wide settings: position-independent code, C++20, and the header list that
# install(TARGETS ... PUBLIC_HEADER) copies.
set_target_properties(pod5_format
    PROPERTIES
        POSITION_INDEPENDENT_CODE 1
        CXX_STANDARD 20
        PUBLIC_HEADER "${public_headers}"
)

# Link these libraries publicly when doing a static lib build
set(maybe_public_libs
    arrow::arrow
    flatbuffers::flatbuffers
)

# A shared pod5_format keeps Arrow/FlatBuffers as PRIVATE link dependencies; a static
# build marks them PUBLIC so they propagate to targets that link pod5_format.
if (BUILD_SHARED_LIB)
    target_link_libraries(pod5_format PRIVATE ${maybe_public_libs})
else()
    target_link_libraries(pod5_format PUBLIC ${maybe_public_libs})
endif()

# Dependencies that are always private. pod5_flatbuffers is the target created by
# flatbuffers_generate_headers() later in this file.
target_link_libraries(pod5_format
    PRIVATE
        pod5_flatbuffers
        zstd::zstd
        ZLIB::ZLIB
        Threads::Threads
)

# Apple platforms additionally link the CoreFoundation framework.
if(APPLE)
    find_library(CORE_FOUNDATION CoreFoundation)
    target_link_libraries(pod5_format PRIVATE ${CORE_FOUNDATION})
endif()

# The source dir serves "pod5_format/..." includes; the binary dir serves the
# generated headers (version.h, pod5_format_export.h).
target_include_directories(pod5_format
    PUBLIC
        ${CMAKE_CURRENT_SOURCE_DIR}
        ${CMAKE_CURRENT_BINARY_DIR}
)

# Generate C++ headers from the footer schema. The resulting pod5_flatbuffers target
# is the one linked privately into pod5_format above.
flatbuffers_generate_headers(
    TARGET pod5_flatbuffers
    SCHEMAS
        pod5_format/flatbuffers/footer.fbs
    INCLUDE_PREFIX ""
    FLAGS --cpp
)

# On non-MSVC compilers treat warnings as errors, with -Wcomment and
# deprecated-declaration warnings switched off.
if (NOT MSVC)
    set(pod5_warning_options -Werror -Wall -Wno-comment -Wno-error=deprecated-declarations -Wno-deprecated-declarations)
    target_compile_options(pod5_format PRIVATE ${pod5_warning_options})
endif()
# Emit pod5_format/pod5_format_export.h (listed in public_headers) into the build tree.
generate_export_header(pod5_format EXPORT_FILE_NAME pod5_format/pod5_format_export.h)

# Install the library together with its PUBLIC_HEADER files.
install(
    TARGETS pod5_format
    PUBLIC_HEADER DESTINATION "include/pod5_format"
)

# svb16 headers keep their own sub-directory in the install tree.
install(
    FILES ${svb16_headers}
    DESTINATION "include/pod5_format/svb16"
)

# Optional sub-projects: examples are opt-in, tests are opt-out, and the Python
# bindings are built only when producing a wheel.
if (POD5_BUILD_EXAMPLES)
    add_subdirectory(examples)
endif()
if (NOT POD5_DISABLE_TESTS)
    add_subdirectory(test)
endif()

if (BUILD_PYTHON_WHEEL)
    add_subdirectory(pod5_format_pybind)
endif()


================================================
FILE: c++/examples/CMakeLists.txt
================================================
# Every example is a single-source executable named after its .cpp file and linked
# against pod5_format, so they are all declared from one list.
set(pod5_example_names
    find_all_read_ids
    find_specific_read_ids
    find_all_read_data
    find_specific_read_ids_with_signal
)

foreach(example_name IN LISTS pod5_example_names)
    add_executable(${example_name}
        ${example_name}.cpp
    )

    target_link_libraries(${example_name}
        pod5_format
    )
    # Needs C++17 to use pod5_format/uuid.h
    set_target_properties(${example_name} PROPERTIES CXX_STANDARD 17)
endforeach()


================================================
FILE: c++/examples/README.md
================================================
C++ Examples
============

These examples use the POD5 C API to read file data. They are written in C++.

find_all_read_ids
-----------------

Find all the read ids in a given pod5 file and save them to a text file.

find_specific_read_ids
----------------------

Find specific read ids in a given pod5 file and save their read numbers to a text file.


================================================
FILE: c++/examples/find_all_read_data.cpp
================================================
#include "pod5_format/c_api.h"
#include "pod5_format/uuid.h"

#include <array>
#include <fstream>
#include <iostream>
#include <vector>

// Example: walk every read in a POD5 file, loading its row info, its complete signal
// and its run info.
//
// Usage: find_all_read_data <file.pod5>
//
// Returns EXIT_FAILURE when the arguments are wrong or any POD5 call fails (the POD5
// error string is printed to stderr where available); otherwise main falls off the
// end, which yields exit status 0.
int main(int argc, char ** argv)
{
    if (argc != 2) {
        std::cerr << "Expected one argument - an pod5 file to search\n";
        return EXIT_FAILURE;
    }

    // Initialise the POD5 library:
    pod5_init();

    // Open the file ready for walking:
    Pod5FileReader_t * file = pod5_open_file(argv[1]);
    if (!file) {
        std::cerr << "Failed to open file " << argv[1] << ": " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::size_t batch_count = 0;
    if (pod5_get_read_batch_count(&batch_count, file) != POD5_OK) {
        std::cerr << "Failed to query batch count: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::size_t read_count = 0;

    for (std::size_t batch_index = 0; batch_index < batch_count; ++batch_index) {
        std::cout << "batch_index: " << batch_index + 1 << "/" << batch_count << "\n";

        Pod5ReadRecordBatch_t * batch = nullptr;
        if (pod5_get_read_batch(&batch, file, batch_index) != POD5_OK) {
            std::cerr << "Failed to get batch: " << pod5_get_error_string() << "\n";
            return EXIT_FAILURE;
        }

        std::size_t batch_row_count = 0;
        if (pod5_get_read_batch_row_count(&batch_row_count, batch) != POD5_OK) {
            std::cerr << "Failed to get batch row count\n";
            return EXIT_FAILURE;
        }

        for (std::size_t row = 0; row < batch_row_count; ++row) {
            uint16_t read_table_version = 0;
            ReadBatchRowInfo_t read_data;
            if (pod5_get_read_batch_row_info_data(
                    batch, row, READ_BATCH_ROW_INFO_VERSION, &read_data, &read_table_version)
                != POD5_OK)
            {
                std::cerr << "Failed to get read " << row << ": " << pod5_get_error_string()
                          << "\n";
                return EXIT_FAILURE;
            }

            read_count += 1;

            // Ask how many samples the read holds so the buffer can be sized to fit.
            // The result is checked: a failure here would otherwise silently leave
            // sample_count at 0 and the read would look empty.
            std::size_t sample_count = 0;
            if (pod5_get_read_complete_sample_count(file, batch, row, &sample_count) != POD5_OK) {
                std::cerr << "Failed to get sample count for read " << row << ": "
                          << pod5_get_error_string() << "\n";
                return EXIT_FAILURE;
            }

            std::vector<std::int16_t> samples;
            samples.resize(sample_count);
            if (pod5_get_read_complete_signal(file, batch, row, samples.size(), samples.data())
                != POD5_OK)
            {
                std::cerr << "Failed to get signal for read " << row << ": "
                          << pod5_get_error_string() << "\n";
                return EXIT_FAILURE;
            }

            // Run info
            RunInfoDictData_t * run_info = nullptr;
            if (pod5_get_run_info(batch, read_data.run_info, &run_info) != POD5_OK) {
                std::cerr << "Failed to get run info " + std::to_string(read_data.run_info) + " : "
                                 + pod5_get_error_string()
                          << "\n";
                return EXIT_FAILURE;
            }

            pod5_free_run_info(run_info);
        }

        if (pod5_free_read_batch(batch) != POD5_OK) {
            std::cerr << "Failed to release batch\n";
            return EXIT_FAILURE;
        }
    }

    std::cout << "Extracted " << read_count << " reads "
              << "\n";

    // Close the reader
    if (pod5_close_and_free_reader(file) != POD5_OK) {
        std::cerr << "Failed to close reader: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    // Cleanup the library
    pod5_terminate();
}


================================================
FILE: c++/examples/find_all_read_ids.cpp
================================================
#include "pod5_format/c_api.h"
#include "pod5_format/uuid.h"

#include <array>
#include <fstream>
#include <iostream>
#include <vector>

// Example: write the read id of every read in a POD5 file to "read_ids.txt" (one id
// per line, in the current working directory). The complete signal of each read is
// loaded as well.
//
// Usage: find_all_read_ids <file.pod5>
//
// Returns EXIT_FAILURE when the arguments are wrong, the output file cannot be
// opened, or any POD5 call fails; otherwise main falls off the end (exit status 0).
int main(int argc, char ** argv)
{
    if (argc != 2) {
        std::cerr << "Expected one argument - an pod5 file to search\n";
        return EXIT_FAILURE;
    }

    // Initialise the POD5 library:
    pod5_init();

    // Open the file ready for walking:
    Pod5FileReader_t * file = pod5_open_file(argv[1]);
    if (!file) {
        std::cerr << "Failed to open file " << argv[1] << ": " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::size_t batch_count = 0;
    if (pod5_get_read_batch_count(&batch_count, file) != POD5_OK) {
        std::cerr << "Failed to query batch count: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::string output_path("read_ids.txt");
    std::cout << "Writing read ids to " << output_path << "\n";
    std::ofstream output_stream(output_path);
    // Without this check an unwritable output location would go unnoticed and the
    // program would still report success.
    if (!output_stream) {
        std::cerr << "Failed to open " << output_path << " for writing\n";
        return EXIT_FAILURE;
    }

    std::size_t read_count = 0;

    for (std::size_t batch_index = 0; batch_index < batch_count; ++batch_index) {
        Pod5ReadRecordBatch_t * batch = nullptr;
        if (pod5_get_read_batch(&batch, file, batch_index) != POD5_OK) {
            std::cerr << "Failed to get batch: " << pod5_get_error_string() << "\n";
            return EXIT_FAILURE;
        }

        std::size_t batch_row_count = 0;
        if (pod5_get_read_batch_row_count(&batch_row_count, batch) != POD5_OK) {
            std::cerr << "Failed to get batch row count\n";
            return EXIT_FAILURE;
        }

        for (std::size_t row = 0; row < batch_row_count; ++row) {
            uint16_t read_table_version = 0;
            ReadBatchRowInfo_t read_data;
            if (pod5_get_read_batch_row_info_data(
                    batch, row, READ_BATCH_ROW_INFO_VERSION, &read_data, &read_table_version)
                != POD5_OK)
            {
                std::cerr << "Failed to get read " << row << "\n";
                return EXIT_FAILURE;
            }

            // 36 characters of formatted UUID plus the terminating null byte.
            std::array<char, 37> formatted_read_id;
            if (pod5_format_read_id(read_data.read_id, formatted_read_id.data()) != POD5_OK) {
                std::cerr << "Failed to format read id for read " << row << ": "
                          << pod5_get_error_string() << "\n";
                return EXIT_FAILURE;
            }
            output_stream << formatted_read_id.data() << "\n";
            read_count += 1;

            // Ask how many samples the read holds so the buffer can be sized to fit;
            // failures are reported instead of being treated as an empty read.
            std::size_t sample_count = 0;
            if (pod5_get_read_complete_sample_count(file, batch, row, &sample_count) != POD5_OK) {
                std::cerr << "Failed to get sample count for read " << row << ": "
                          << pod5_get_error_string() << "\n";
                return EXIT_FAILURE;
            }

            std::vector<std::int16_t> samples;
            samples.resize(sample_count);
            if (pod5_get_read_complete_signal(file, batch, row, samples.size(), samples.data())
                != POD5_OK)
            {
                std::cerr << "Failed to get signal for read " << row << ": "
                          << pod5_get_error_string() << "\n";
                return EXIT_FAILURE;
            }
        }

        if (pod5_free_read_batch(batch) != POD5_OK) {
            std::cerr << "Failed to release batch\n";
            return EXIT_FAILURE;
        }
    }

    std::cout << "Extracted " << read_count << " read ids into " << output_path << "\n";

    // Close the reader
    if (pod5_close_and_free_reader(file) != POD5_OK) {
        std::cerr << "Failed to close reader: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    // Cleanup the library
    pod5_terminate();
}


================================================
FILE: c++/examples/find_specific_read_ids.cpp
================================================
#include "pod5_format/c_api.h"
#include "pod5_format/uuid.h"

#include <fstream>
#include <iostream>
#include <vector>

// Example: look up a list of read ids in a POD5 file and write the read number of
// every read that was found to "read_ids.txt" (one number per line).
//
// Usage: find_specific_read_ids <file.pod5> <read_ids.txt>
// The second argument is a text file with one UUID per line; lines that do not
// parse as a UUID are reported and skipped.
//
// Returns EXIT_FAILURE when the arguments are wrong, either text file cannot be
// opened, or any POD5 call fails; otherwise main falls off the end (exit status 0).
int main(int argc, char ** argv)
{
    if (argc != 3) {
        std::cerr << "Expected two arguments:\n"
                  << " - an pod5 file to search\n"
                  << " - a file containing newline separated of read ids\n";
        return EXIT_FAILURE;
    }

    // Initialise the POD5 library:
    pod5_init();

    // Open the file ready for walking:
    Pod5FileReader_t * file = pod5_open_file(argv[1]);
    if (!file) {
        std::cerr << "Failed to open file " << argv[1] << ": " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::size_t batch_count = 0;
    if (pod5_get_read_batch_count(&batch_count, file) != POD5_OK) {
        std::cerr << "Failed to query batch count: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::vector<pod5::Uuid> search_uuids;
    std::string input_path(argv[2]);
    try {
        std::cout << "Reading input read ids from " << input_path << "\n";
        std::string line;
        std::ifstream input_stream(input_path);
        // An unreadable id file would otherwise look like an empty list of ids.
        if (!input_stream) {
            std::cerr << "Failed to open " << input_path << " for reading\n";
            return EXIT_FAILURE;
        }
        while (std::getline(input_stream, line)) {
            auto const uuid = pod5::Uuid::from_string(line);
            if (!uuid) {
                std::cerr << '"' << line << "\" is not a valid UUID, ignoring it\n";
            } else {
                search_uuids.push_back(*uuid);
            }
        }
        std::cout << "  Read " << search_uuids.size() << " ids from the text file\n";
    } catch (std::exception const & e) {
        // Best effort: carry on with whatever ids were parsed before the exception.
        std::cerr << "Failed to parse UUID values from " << input_path << ": " << e.what() << "\n";
    }

    std::string output_path("read_ids.txt");
    std::cout << "Writing selected read numbers to " << output_path << "\n";
    std::ofstream output_stream(output_path);
    // Without this check an unwritable output location would go unnoticed and the
    // program would still report success.
    if (!output_stream) {
        std::cerr << "Failed to open " << output_path << " for writing\n";
        return EXIT_FAILURE;
    }

    // Plan the most efficient route through the file for the required read ids:
    // traversal_batch_counts receives one count per read batch, and
    // traversal_row_indices holds the rows to visit, grouped batch after batch.
    std::vector<std::uint32_t> traversal_batch_counts(batch_count);
    std::vector<std::uint32_t> traversal_row_indices(search_uuids.size());
    std::size_t find_success_count = 0;
    if (pod5_plan_traversal(
            file,
            (uint8_t *)search_uuids.data(),
            search_uuids.size(),
            traversal_batch_counts.data(),
            traversal_row_indices.data(),
            &find_success_count)
        != POD5_OK)
    {
        std::cerr << "Failed to plan traversal of file: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    if (find_success_count != search_uuids.size()) {
        std::cerr << "Failed to find " << (search_uuids.size() - find_success_count) << " reads\n";
    }

    std::size_t read_count = 0;
    // Offset of the current batch's first entry within traversal_row_indices.
    std::size_t row_offset = 0;

    // Walk the suggested traversal route, storing read data.
    for (std::size_t batch_index = 0; batch_index < batch_count; ++batch_index) {
        Pod5ReadRecordBatch_t * batch = nullptr;
        if (pod5_get_read_batch(&batch, file, batch_index) != POD5_OK) {
            std::cerr << "Failed to get batch: " << pod5_get_error_string() << "\n";
            return EXIT_FAILURE;
        }

        std::cout << "Processing batch " << (batch_index + 1) << " of " << batch_count << "\n";
        for (std::size_t row_index = 0; row_index < traversal_batch_counts[batch_index];
             ++row_index)
        {
            std::uint32_t batch_row = traversal_row_indices[row_index + row_offset];

            uint16_t read_table_version = 0;
            ReadBatchRowInfo_t read_data;
            if (pod5_get_read_batch_row_info_data(
                    batch, batch_row, READ_BATCH_ROW_INFO_VERSION, &read_data, &read_table_version)
                != POD5_OK)
            {
                std::cerr << "Failed to get read " << batch_row << "\n";
                return EXIT_FAILURE;
            }

            output_stream << read_data.read_number << "\n";
            read_count += 1;
        }
        row_offset += traversal_batch_counts[batch_index];

        if (pod5_free_read_batch(batch) != POD5_OK) {
            std::cerr << "Failed to release batch\n";
            return EXIT_FAILURE;
        }
    }

    std::cout << "Extracted " << read_count << " read numbers into " << output_path << "\n";

    // Close the reader
    if (pod5_close_and_free_reader(file) != POD5_OK) {
        std::cerr << "Failed to close reader: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    // Cleanup the library
    pod5_terminate();
}


================================================
FILE: c++/examples/find_specific_read_ids_with_signal.cpp
================================================
#include "pod5_format/c_api.h"
#include "pod5_format/uuid.h"

#include <fstream>
#include <iostream>
#include <vector>

// Example: look up a list of read ids in a POD5 file, load the complete signal of
// every read that was found, and write "<calibration_offset> <calibration_scale>
// <sum of samples>" per read to "read_ids.txt".
//
// Usage: find_specific_read_ids_with_signal <file.pod5> <read_ids.txt>
// The second argument is a text file with one UUID per line; lines that do not
// parse as a UUID are reported and skipped.
//
// Returns EXIT_FAILURE when the arguments are wrong, either text file cannot be
// opened, or any POD5 call fails; otherwise main falls off the end (exit status 0).
int main(int argc, char ** argv)
{
    if (argc != 3) {
        std::cerr << "Expected two arguments:\n"
                  << " - an pod5 file to search\n"
                  << " - a file containing newline separated of read ids\n";
        return EXIT_FAILURE;
    }

    // Initialise the POD5 library:
    pod5_init();

    // Open the file ready for walking:
    Pod5FileReader_t * file = pod5_open_file(argv[1]);
    if (!file) {
        std::cerr << "Failed to open file " << argv[1] << ": " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::size_t batch_count = 0;
    if (pod5_get_read_batch_count(&batch_count, file) != POD5_OK) {
        std::cerr << "Failed to query batch count: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    std::vector<pod5::Uuid> search_uuids;
    std::string input_path(argv[2]);
    try {
        std::cout << "Reading input read ids from " << input_path << "\n";
        std::string line;
        std::ifstream input_stream(input_path);
        // An unreadable id file would otherwise look like an empty list of ids.
        if (!input_stream) {
            std::cerr << "Failed to open " << input_path << " for reading\n";
            return EXIT_FAILURE;
        }
        while (std::getline(input_stream, line)) {
            auto const uuid = pod5::Uuid::from_string(line);
            if (!uuid) {
                std::cerr << '"' << line << "\" is not a valid UUID, ignoring it\n";
            } else {
                search_uuids.push_back(*uuid);
            }
        }
        std::cout << "  Read " << search_uuids.size() << " ids from the text file\n";
    } catch (std::exception const & e) {
        // Best effort: carry on with whatever ids were parsed before the exception.
        std::cerr << "Failed to parse UUID values from " << input_path << ": " << e.what() << "\n";
    }

    std::string output_path("read_ids.txt");
    std::cout << "Writing selected read numbers to " << output_path << "\n";
    std::ofstream output_stream(output_path);
    // Without this check an unwritable output location would go unnoticed and the
    // program would still report success.
    if (!output_stream) {
        std::cerr << "Failed to open " << output_path << " for writing\n";
        return EXIT_FAILURE;
    }

    // Plan the most efficient route through the file for the required read ids:
    // traversal_batch_counts receives one count per read batch, and
    // traversal_row_indices holds the rows to visit, grouped batch after batch.
    std::vector<std::uint32_t> traversal_batch_counts(batch_count);
    std::vector<std::uint32_t> traversal_row_indices(search_uuids.size());
    std::size_t find_success_count = 0;
    if (pod5_plan_traversal(
            file,
            (uint8_t *)search_uuids.data(),
            search_uuids.size(),
            traversal_batch_counts.data(),
            traversal_row_indices.data(),
            &find_success_count)
        != POD5_OK)
    {
        std::cerr << "Failed to plan traversal of file: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    if (find_success_count != search_uuids.size()) {
        std::cerr << "Failed to find " << (search_uuids.size() - find_success_count) << " reads\n";
    }

    std::size_t read_count = 0;
    std::size_t samples_read = 0;

    // Offset of the current batch's first entry within traversal_row_indices.
    std::size_t row_offset = 0;

    // Walk the suggested traversal route, storing read data.
    for (std::size_t batch_index = 0; batch_index < batch_count; ++batch_index) {
        Pod5ReadRecordBatch_t * batch = nullptr;
        if (pod5_get_read_batch(&batch, file, batch_index) != POD5_OK) {
            std::cerr << "Failed to get batch: " << pod5_get_error_string() << "\n";
            return EXIT_FAILURE;
        }

        std::cout << "Processing batch " << (batch_index + 1) << " of " << batch_count << "\n";
        for (std::size_t row_index = 0; row_index < traversal_batch_counts[batch_index];
             ++row_index)
        {
            std::uint32_t batch_row = traversal_row_indices[row_index + row_offset];

            uint16_t read_table_version = 0;
            ReadBatchRowInfo_t read_data;
            if (pod5_get_read_batch_row_info_data(
                    batch, batch_row, READ_BATCH_ROW_INFO_VERSION, &read_data, &read_table_version)
                != POD5_OK)
            {
                std::cerr << "Failed to get read " << batch_row << "\n";
                return EXIT_FAILURE;
            }

            // Ask how many samples the read holds so the buffer can be sized to fit.
            // Failures are reported rather than written out as a bogus sum of 0.
            std::size_t sample_count = 0;
            if (pod5_get_read_complete_sample_count(file, batch, batch_row, &sample_count)
                != POD5_OK)
            {
                std::cerr << "Failed to get sample count for read " << batch_row << ": "
                          << pod5_get_error_string() << "\n";
                return EXIT_FAILURE;
            }

            std::vector<std::int16_t> samples;
            samples.resize(sample_count);
            if (pod5_get_read_complete_signal(
                    file, batch, batch_row, samples.size(), samples.data())
                != POD5_OK)
            {
                std::cerr << "Failed to get signal for read " << batch_row << ": "
                          << pod5_get_error_string() << "\n";
                return EXIT_FAILURE;
            }

            // Accumulate in 64 bits: the samples are 16 bit values and reads can be long.
            std::int64_t samples_sum = 0;
            for (std::size_t i = 0; i < samples.size(); ++i) {
                samples_sum += samples[i];
            }

            output_stream << read_data.calibration_offset << " " << read_data.calibration_scale
                          << " " << samples_sum << "\n";
            read_count += 1;
            samples_read += samples.size();
        }
        row_offset += traversal_batch_counts[batch_index];

        if (pod5_free_read_batch(batch) != POD5_OK) {
            std::cerr << "Failed to release batch\n";
            return EXIT_FAILURE;
        }
    }

    std::cout << "Extracted " << read_count << " reads and " << samples_read << " samples into "
              << output_path << "\n";

    // Close the reader
    if (pod5_close_and_free_reader(file) != POD5_OK) {
        std::cerr << "Failed to close reader: " << pod5_get_error_string() << "\n";
        return EXIT_FAILURE;
    }

    // Cleanup the library
    pod5_terminate();
}


================================================
FILE: c++/pod5_format/async_signal_loader.cpp
================================================
#include "pod5_format/async_signal_loader.h"

namespace pod5 {

// Smallest number of rows a worker claims in one job: the constructor uses it as the
// lower bound when computing m_worker_job_size.
std::size_t const AsyncSignalLoader::MINIMUM_JOB_SIZE = 50;

// Create a loader over `reader` and start `worker_count` threads running run_worker().
//
// reader               File whose read batches and signal are loaded.
// samples_mode         With SamplesMode::Samples the signal itself is extracted in
//                      addition to the sample count (see do_work()).
// batch_counts         Per read-batch counts; may be empty (see run_worker()).
//                      Presumably the batch counts of a traversal plan - confirm
//                      against the header.
// batch_rows           Rows to load; only its size is used here, to derive the job size.
// worker_count         Number of worker threads to start.
// max_pending_batches  Workers pause while more than this many finished batches are
//                      waiting to be taken by release_next_batch().
//
// A failure to set up the first batch is stored with set_error() and reported by
// release_next_batch(); the constructor itself does not fail.
AsyncSignalLoader::AsyncSignalLoader(
    std::shared_ptr<pod5::FileReader> const & reader,
    SamplesMode samples_mode,
    gsl::span<std::uint32_t const> const & batch_counts,
    gsl::span<std::uint32_t const> const & batch_rows,
    std::size_t worker_count,
    std::size_t max_pending_batches)
: m_reader(reader)
, m_samples_mode(samples_mode)
, m_max_pending_batches(max_pending_batches)
, m_reads_batch_count(m_reader->num_read_record_batches())
, m_batch_counts(batch_counts)
, m_total_batch_count_so_far(0)
, m_batch_rows(batch_rows)
// Aim for roughly two jobs per worker per batch, but never fewer than
// MINIMUM_JOB_SIZE rows. The divisor is clamped to 1 because it is zero for a file
// without read batches (or worker_count == 0), and integer division by zero is
// undefined behaviour.
, m_worker_job_size(
      std::max<std::size_t>(
          MINIMUM_JOB_SIZE,
          m_batch_rows.size()
              / std::max<std::size_t>(1, m_reads_batch_count * worker_count * 2)))
, m_current_batch(0)
, m_finished(false)
, m_has_error(false)
, m_batches_size(0)
{
    // Setup first batch:
    {
        std::unique_lock<std::mutex> l(m_worker_sync);
        auto setup_result = setup_next_in_progress_batch(l);
        if (!setup_result.ok()) {
            set_error(setup_result);
        }
    }

    // Kick off workers on jobs:
    for (std::size_t i = 0; i < worker_count; ++i) {
        m_workers.emplace_back([&] { run_worker(); });
    }
}

AsyncSignalLoader::~AsyncSignalLoader()
{
    // Raise the finished flag first so every worker's loop condition fails, then
    // block until each worker thread has returned.
    m_finished = true;
    for (auto & worker : m_workers) {
        worker.join();
    }
}

// Hand the next loaded batch to the caller.
//
// timeout  Optional absolute deadline. Without one the function keeps waiting, in
//          slices of five seconds, until a batch, the end of the data or an error
//          turns up.
//
// Returns the batch's data once all of its rows are complete, the stored error if one
// has been recorded, or nullptr when the deadline passed without a batch or when
// there is no more data.
Result<std::unique_ptr<CachedBatchSignalData>> AsyncSignalLoader::release_next_batch(
    std::optional<std::chrono::steady_clock::time_point> timeout)
{
    std::shared_ptr<SignalCacheWorkPackage> batch;

    // Return any error, if one has occurred:
    if (m_has_error) {
        return error();
    }

    // First wait until there is a batch available:
    do {
        std::unique_lock<std::mutex> l(m_batches_sync);
        // Wait until there is a batch available:
        // (the predicate also ends the wait once loading has finished or failed)
        m_batch_done.wait_until(
            l, timeout.value_or(std::chrono::steady_clock::now() + std::chrono::seconds(5)), [&] {
                return m_batches.size() || m_finished || m_has_error;
            });

        // Grab a batch if one exists (note error or user destroying us might have happened instead):
        if (!m_batches.empty()) {
            batch = std::move(m_batches.front());
            assert(batch);
            m_batches.pop_front();
            // Keep the counter the workers use for back-pressure in step with the queue.
            m_batches_size -= 1;
            break;
        }

        // Only a caller-supplied deadline ends the wait early; the default five second
        // slice simply loops round again.
        if (timeout && std::chrono::steady_clock::now() > *timeout) {
            return nullptr;
        }
    } while (!m_finished && !m_has_error);

    // Return any error, if one has occurred during our wait:
    if (m_has_error) {
        return error();
    }

    // If we got a batch, wait for all work to be finished, then return it:
    if (batch) {
        // Wait if we are ahead of the loader:
        // (a batch is queued once all of its rows are handed out, which can be before
        // the workers have finished them, hence the polling)
        while (!batch->is_complete()) {
            std::this_thread::sleep_for(std::chrono::milliseconds(1));
        }

        return batch->release_data();
    }

    // No more data - return null.
    return nullptr;
}

// Record `status` (which must be a failure) as the loader's error.
void AsyncSignalLoader::set_error(pod5::Status status)
{
    assert(!status.ok());
    {
        // Store the status under the error mutex...
        std::lock_guard<std::mutex> guard(m_error_mutex);
        m_error = std::move(status);
    }
    // ...and only then raise the flag, so anyone who sees the flag finds the status.
    m_has_error = true;
}

// Return a copy of the stored error status, read under the error mutex.
pod5::Status AsyncSignalLoader::error() const
{
    std::lock_guard<std::mutex> guard(m_error_mutex);
    return m_error;
}

// Body of every worker thread: repeatedly claim a job of up to m_worker_job_size rows
// from the in-progress batch (under m_worker_sync), load those rows outside the lock
// with do_work(), and report them complete. The loop ends once all read batches have
// been handed out, the loader has been marked finished, or an error has been recorded.
void AsyncSignalLoader::run_worker()
{
    // Continue to work while there is work to do, and no error has occurred
    while (!m_finished && !m_has_error) {
        std::shared_ptr<SignalCacheWorkPackage> batch;
        std::uint32_t row_start = 0;

        // Try to secure some new work:
        {
            std::unique_lock<std::mutex> l(m_worker_sync);
            // If we have run out of batches to process, release anything in progress and return:
            if (m_current_batch >= m_reads_batch_count) {
                release_in_progress_batch();
                break;
            }

            // If we have more batches than asked for complete that have
            // not been queried, wait for it to get taken:
            if (m_batches_size > m_max_pending_batches) {
                // Drop the lock before sleeping so other threads are not blocked meanwhile.
                l.unlock();
                std::this_thread::sleep_for(std::chrono::milliseconds(10));
                continue;
            }

            // Now, if we have no work left in the current batch, release that:
            if (!m_in_progress_batch->has_work_left()) {
                // Advance the running total by the finished batch's count when
                // per-batch counts were supplied.
                if (!m_batch_counts.empty()) {
                    m_total_batch_count_so_far += m_batch_counts[m_current_batch];
                }

                // Release the current batch:
                release_in_progress_batch();

                // Then try to setup the next batch, if one exists:
                m_current_batch += 1;
                if (m_current_batch >= m_reads_batch_count) {
                    // No more work to do.
                    m_finished = true;
                    break;
                }

                auto setup_result = setup_next_in_progress_batch(l);
                if (!setup_result.ok()) {
                    set_error(setup_result);
                    return;
                }
            }

            // Finally, tell the work package we have secured we are starting to do some work:
            batch = m_in_progress_batch;
            row_start = m_in_progress_batch->start_rows(l, m_worker_job_size);
        }

        // Now execute the work, for all the rows we said we would:
        // (the end is clamped to the number of rows in the job for the last, short job)
        std::uint32_t const row_end =
            std::min(row_start + m_worker_job_size, batch->job_row_count());

        do_work(batch, row_start, row_end);

        // And report the work completed for anyone waiting:
        // NOTE(review): the full job size is reported even when row_end was clamped or
        // do_work() returned early on an error - presumably complete_rows() mirrors
        // start_rows(); confirm.
        batch->complete_rows(m_worker_job_size);
    }
}

// Load signal information for job rows [row_start, row_end) of `batch`.
//
// For each job row the sample count is always computed; the samples themselves
// are only extracted when the loader was created with SamplesMode::Samples.
// On the first failure the error is recorded with set_error() and the function
// returns immediately, leaving the remaining rows of the range unset.
void AsyncSignalLoader::do_work(
    std::shared_ptr<SignalCacheWorkPackage> const & batch,
    std::uint32_t row_start,
    std::uint32_t row_end)
{
    // The signal column holds, per read, the list of signal table rows for that read.
    auto const signal_list_column = batch->read_batch().signal_column();

    for (std::uint32_t job_row = row_start; job_row < row_end; ++job_row) {
        // A job row may map onto a different batch row when only a subset of the
        // batch was requested.
        auto const batch_row = batch->get_batch_row_to_query(job_row);

        // View the signal table row indices belonging to this read.
        auto const signal_row_indices = std::static_pointer_cast<arrow::UInt64Array>(
            signal_list_column->value_slice(batch_row));
        auto const signal_row_span =
            gsl::make_span(signal_row_indices->raw_values(), signal_row_indices->length());

        // The total sample count is needed in both modes.
        auto counted = m_reader->extract_sample_count(signal_row_span);
        if (!counted.ok()) {
            set_error(counted.status());
            return;
        }
        std::uint64_t total_samples = *counted;

        // Only pay for sample extraction when the caller asked for the samples.
        std::vector<std::int16_t> signal;
        bool const load_samples = (m_samples_mode == SamplesMode::Samples);
        if (load_samples) {
            signal.resize(total_samples);
            auto extract_status =
                m_reader->extract_samples(signal_row_span, gsl::make_span(signal));
            if (!extract_status.ok()) {
                set_error(std::move(extract_status));
                return;
            }
            total_samples = signal.size();
        }

        // Publish the result for this job row into the batch cache.
        batch->set_samples(job_row, total_samples, std::move(signal));
    }
}

// Read batch `m_current_batch` from the reader and install it as the in-progress
// work package.
//
// `lock` is not used in the body; the header documents it as a lock held on
// m_worker_sync. Returns the reader's error if the batch cannot be read,
// otherwise Status::OK().
Status AsyncSignalLoader::setup_next_in_progress_batch(std::unique_lock<std::mutex> & lock)
{
    assert(!m_in_progress_batch);

    ARROW_ASSIGN_OR_RAISE(auto loaded_batch, m_reader->read_read_record_batch(m_current_batch));

    // Without per-batch counts every row of the batch is processed, in batch order.
    std::size_t rows_to_process = loaded_batch.num_rows();
    gsl::span<std::uint32_t const> selected_rows;

    bool const has_batch_counts = !m_batch_counts.empty();
    if (has_batch_counts) {
        // The caller supplied how many rows of this batch should be processed.
        rows_to_process = m_batch_counts[m_current_batch];
    }
    if (has_batch_counts && !m_batch_rows.empty()) {
        // ...and which rows: this batch's slice starts after all rows consumed so far.
        selected_rows = m_batch_rows.subspan(m_total_batch_count_so_far, rows_to_process);
    }

    m_in_progress_batch = std::make_shared<SignalCacheWorkPackage>(
        m_current_batch, rows_to_process, selected_rows, std::move(loaded_batch));
    return Status::OK();
}

// Move the in-progress batch (if any) onto the queue of batches available to
// readers and wake anyone waiting on m_batch_done.
void AsyncSignalLoader::release_in_progress_batch()
{
    // Nothing to hand over.
    if (!m_in_progress_batch) {
        return;
    }

    // All rows must have been handed out to workers before the batch is released.
    assert(!m_in_progress_batch->has_work_left());

    std::lock_guard<std::mutex> batches_lock(m_batches_sync);
    m_batches.push_back(std::move(m_in_progress_batch));
    ++m_batches_size;
    m_batch_done.notify_all();
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/async_signal_loader.h
================================================
#pragma once

#include "pod5_format/file_reader.h"
#include "pod5_format/pod5_format_export.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/signal_table_reader.h"

#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>

#include <atomic>
#include <chrono>
#include <condition_variable>
#include <cstddef>
#include <cstdint>
#include <deque>
#include <memory>
#include <mutex>
#include <optional>
#include <thread>
#include <vector>

namespace pod5 {

/// Signal data cached for one read table batch.
///
/// Holds one sample count and one sample vector per requested row. Both vectors
/// are sized to `entry_count` on construction and filled in row by row through
/// set_samples().
class POD5_FORMAT_EXPORT CachedBatchSignalData {
public:
    /// \param batch_index Index of the read table batch this data belongs to.
    /// \param entry_count Number of rows that results will be stored for.
    CachedBatchSignalData(std::uint32_t batch_index, std::size_t entry_count)
    : m_batch_index(batch_index)
    , m_sample_counts(entry_count)
    , m_samples(entry_count)
    {
    }

    /// Index of the read table batch this data was loaded from.
    std::uint32_t batch_index() const { return m_batch_index; }

    /// Find a list of sample counts for all requested batch rows.
    std::vector<std::uint64_t> const & sample_count() const { return m_sample_counts; }

    /// Find a list of signal samples for all requested batch rows.
    /// \note An entry is whatever vector was passed to set_samples() for that row;
    ///       rows that have not been set hold an empty vector.
    std::vector<std::vector<std::int16_t>> const & samples() const { return m_samples; }

    /// Store the result for one row.
    /// \param row          Index into the requested rows; must be below the
    ///                     `entry_count` given at construction (not checked here).
    /// \param sample_count Sample count to record for the row.
    /// \param samples      Samples for the row; moved into the cache.
    void
    set_samples(std::size_t row, std::uint64_t sample_count, std::vector<std::int16_t> && samples)
    {
        m_sample_counts[row] = sample_count;
        m_samples[row] = std::move(samples);
    }

private:
    std::uint32_t m_batch_index;
    // Indexed by requested row.
    std::vector<std::uint64_t> m_sample_counts;
    // Indexed by requested row.
    std::vector<std::vector<std::int16_t>> m_samples;
};

/// Unit of work covering the requested rows of a single read table batch.
///
/// Tracks which job rows have been handed out (start_rows) and how many have
/// been reported finished (complete_rows), and owns the CachedBatchSignalData
/// that results are written into until release_data() is called.
class POD5_FORMAT_EXPORT SignalCacheWorkPackage {
public:
    /// \param batch_index       Index of the read table batch being processed.
    /// \param job_row_count     Number of job rows to process.
    /// \param specific_job_rows Optional list of batch rows to process; when empty,
    ///                          job row N maps directly to batch row N. The span is
    ///                          stored as a view, not copied.
    /// \param read_batch        The loaded read table batch; moved into the package.
    SignalCacheWorkPackage(
        std::uint32_t batch_index,
        std::size_t job_row_count,
        gsl::span<std::uint32_t const> const & specific_job_rows,
        pod5::ReadTableRecordBatch && read_batch)
    : m_job_row_count(job_row_count)
    , m_specific_job_rows(specific_job_rows)
    , m_next_row_to_start(0)
    , m_completed_rows(0)
    // Uses m_job_row_count, which is declared (and so initialised) before m_cached_data.
    , m_cached_data(std::make_unique<CachedBatchSignalData>(batch_index, m_job_row_count))
    , m_read_batch(std::move(read_batch))
    {
    }

    /// Number of job rows in this package (the stored std::size_t converted to std::uint32_t).
    std::uint32_t job_row_count() const { return m_job_row_count; }

    /// Forward the result for job row `row` to the cached data.
    void
    set_samples(std::size_t row, std::uint64_t sample_count, std::vector<std::int16_t> && samples)
    {
        m_cached_data->set_samples(row, sample_count, std::move(samples));
    }

    /// Hand ownership of the cached data to the caller.
    /// \note The package no longer holds the data after this call.
    std::unique_ptr<CachedBatchSignalData> release_data() { return std::move(m_cached_data); }

    /// The read table batch this package is working on.
    pod5::ReadTableRecordBatch const & read_batch() const { return m_read_batch; }

    // Find the actual batch row to query, for a given job row index.
    std::uint32_t get_batch_row_to_query(std::uint32_t job_row_index) const
    {
        // We allow the caller to specify a subset of batch rows to iterate:
        if (!m_specific_job_rows.empty()) {
            return m_specific_job_rows[job_row_index];
        }

        return job_row_index;
    }

    /// Claim the next `row_count` job rows and return the index of the first one.
    /// \note `l` is not used in the body; m_next_row_to_start is a plain integer, so
    ///       presumably the parameter exists to show the caller holds the worker lock
    ///       - confirm against run_worker.
    /// \note The claimed range may extend past job_row_count(); callers clamp the end.
    std::uint32_t start_rows(std::unique_lock<std::mutex> & l, std::size_t row_count)
    {
        auto row = m_next_row_to_start;
        m_next_row_to_start += row_count;
        return row;
    }

    /// Record that `row_count` previously claimed rows have been processed.
    void complete_rows(std::uint32_t row_count) { m_completed_rows += row_count; }

    /// True while there are job rows that have not yet been claimed via start_rows().
    bool has_work_left() const { return m_next_row_to_start < m_job_row_count; }

    /// True once at least job_row_count() rows have been reported via complete_rows().
    bool is_complete() const { return m_completed_rows.load() >= m_job_row_count; }

private:
    std::size_t m_job_row_count;
    gsl::span<std::uint32_t const> m_specific_job_rows;

    // Next job row to hand out; not atomic.
    std::uint32_t m_next_row_to_start;
    // Rows reported complete; atomic so is_complete() can be polled without a lock.
    std::atomic<std::uint32_t> m_completed_rows;

    std::unique_ptr<CachedBatchSignalData> m_cached_data;
    pod5::ReadTableRecordBatch m_read_batch;
};

/// Loads signal data for the reads of a file on worker threads and hands the
/// results back to the caller one read table batch at a time.
class POD5_FORMAT_EXPORT AsyncSignalLoader {
public:
    // Minimum number of tasks one thread will do in a batch.
    static std::size_t const MINIMUM_JOB_SIZE;

    /// Selects how much signal information is loaded per read.
    enum class SamplesMode {
        /// Only sample counts are computed.
        NoSamples,
        /// Sample counts are computed and the samples themselves are extracted.
        Samples,
    };

    /// \param reader              File to load signal from.
    /// \param samples_mode        Whether samples are extracted as well as counted.
    /// \param batch_counts        Optional number of rows to process per batch; when
    ///                            empty every row of every batch is processed.
    /// \param batch_rows          Optional batch row indices to process, laid out batch
    ///                            after batch and used together with \p batch_counts.
    /// \param worker_count        Number of worker threads
    ///                            (defaults to std::thread::hardware_concurrency()).
    /// \param max_pending_batches Limit on finished batches waiting to be collected
    ///                            before workers pause.
    /// \note The two spans are stored as views in m_batch_counts / m_batch_rows.
    AsyncSignalLoader(
        std::shared_ptr<pod5::FileReader> const & reader,
        SamplesMode samples_mode,
        gsl::span<std::uint32_t const> const & batch_counts,
        gsl::span<std::uint32_t const> const & batch_rows,
        std::size_t worker_count = std::thread::hardware_concurrency(),
        std::size_t max_pending_batches = 10);

    ~AsyncSignalLoader();

    /// Find if all work is complete in the loader.
    bool is_finished() const { return m_finished; }

    /// Get the next batch of loaded signal, always returns the consecutive next signal batch
    /// \note Returns nullptr when timeout occurs, or if all data is exhausted.
    Result<std::unique_ptr<CachedBatchSignalData>> release_next_batch(
        std::optional<std::chrono::steady_clock::time_point> timeout = std::nullopt);

private:
    /// Set an error code that will stop all async loading and return an error to the caller.
    void set_error(pod5::Status status);
    pod5::Status error() const;

    /// Worker thread entry point.
    void run_worker();

    /// Load signal data for job rows [row_start, row_end) of \p batch.
    void do_work(
        std::shared_ptr<SignalCacheWorkPackage> const & batch,
        std::uint32_t row_start,
        std::uint32_t row_end);

    /// Setup a new batch for in progress work to contain.
    /// \param lock A lock held on m_worker_sync.
    /// \note There must not be a batch already in progress.
    /// \note m_current_batch is used as the index of the next batch to begin.
    Status setup_next_in_progress_batch(std::unique_lock<std::mutex> & lock);

    /// Release the currently in progress batch to readers, if it exists.
    /// \note This call locks m_batches_sync internally.
    /// \note The batch must not have any work remaining to start, but can be completing already started work.
    /// \note This call notifies the condition variable to alert readers that new data is available.
    void release_in_progress_batch();

    std::shared_ptr<pod5::FileReader> m_reader;
    SamplesMode m_samples_mode;
    std::size_t m_max_pending_batches;
    std::size_t m_reads_batch_count;
    // Optional per-batch row counts supplied by the caller (may be empty).
    gsl::span<std::uint32_t const> m_batch_counts;
    // Running offset into m_batch_rows: sum of m_batch_counts for batches already finished.
    std::size_t m_total_batch_count_so_far;
    // Optional batch row indices supplied by the caller (may be empty).
    gsl::span<std::uint32_t const> m_batch_rows;

    // Number of job rows a worker claims at a time.
    std::uint32_t const m_worker_job_size;

    std::mutex m_worker_sync;
    // Notified whenever a batch is released to m_batches.
    std::condition_variable m_batch_done;
    // Index of the read table batch currently being worked on.
    std::uint32_t m_current_batch;

    std::atomic<bool> m_finished;
    std::atomic<bool> m_has_error;
    mutable std::mutex m_error_mutex;
    pod5::Status m_error;
    std::shared_ptr<SignalCacheWorkPackage> m_in_progress_batch;

    // Locked while m_batches is modified by release_in_progress_batch().
    std::mutex m_batches_sync;
    // Number of entries in m_batches, readable without taking m_batches_sync.
    std::atomic<std::uint32_t> m_batches_size;
    std::deque<std::shared_ptr<SignalCacheWorkPackage>> m_batches;

    std::vector<std::thread> m_workers;
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/c_api.cpp
================================================
#include "pod5_format/c_api.h"

#include "pod5_format/file_reader.h"
#include "pod5_format/file_writer.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/signal_compression.h"
#include "pod5_format/signal_table_reader.h"
#include "pod5_format/uuid.h"

#include <arrow/array/array_binary.h>
#include <arrow/array/array_dict.h>
#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/memory_pool.h>
#include <arrow/type.h>

#include <limits>
#include <optional>

//---------------------------------------------------------------------------------------------------------------------
// Opaque handle type handed out by the C API for an open file reader.
struct Pod5FileReader {
    // Takes over the caller's shared reader.
    Pod5FileReader(std::shared_ptr<pod5::FileReader> && reader_) : reader(std::move(reader_)) {}

    // Shared (and const) so batches created from this handle can hold their own reference.
    std::shared_ptr<pod5::FileReader const> reader;
};

// Opaque handle type handed out by the C API for an open file writer.
struct Pod5FileWriter {
    // Takes over ownership of the writer.
    Pod5FileWriter(std::unique_ptr<pod5::FileWriter> && writer_) : writer(std::move(writer_)) {}

    // Sole owner of the underlying writer.
    std::unique_ptr<pod5::FileWriter> writer;
};

// Opaque handle type handed out by the C API for one read table batch.
// Holds its own reference to the reader the batch was loaded from, which the
// batch-level calls use for file-wide lookups such as run info.
struct Pod5ReadRecordBatch {
    Pod5ReadRecordBatch(
        pod5::ReadTableRecordBatch && batch_,
        std::shared_ptr<pod5::FileReader const> reader_)
    : batch(std::move(batch_))
    , reader(std::move(reader_))
    {
    }

    pod5::ReadTableRecordBatch const batch;
    std::shared_ptr<pod5::FileReader const> reader;
};

namespace {
//---------------------------------------------------------------------------------------------------------------------
// Last error recorded by the C API on the calling thread: code and message.
// Both are thread_local, so each thread sees only the errors of its own calls.
thread_local pod5_error_t g_pod5_error_no;
thread_local std::string g_pod5_error_string;

// Record `status` as the calling thread's current error: its message becomes
// the error string and its status code is converted to pod5_error_t.
void pod5_set_error(arrow::Status status)
{
    g_pod5_error_string = status.ToString();
    g_pod5_error_no = static_cast<pod5_error_t>(status.code());
}

// Clear the calling thread's error state. The public entry points in this file
// that can fail call this first, so a stale error from an earlier call is never
// reported for a later, successful one.
void pod5_reset_error()
{
    g_pod5_error_no = pod5_error_t::POD5_OK;
    g_pod5_error_string.clear();
}

// Evaluate `result` (an expression convertible to arrow::Status). If it is not
// OK, record it as the thread's error and return the error code from the
// enclosing function, which must therefore return pod5_error_t.
#define POD5_C_RETURN_NOT_OK(result)    \
    do {                                \
        ::arrow::Status __s = (result); \
        if (!__s.ok()) {                \
            pod5_set_error(__s);        \
            return g_pod5_error_no;     \
        }                               \
    } while (0)

// Implementation detail of POD5_C_ASSIGN_OR_RAISE: `result_name` is the unique
// temporary that holds the Result while it is checked and unwrapped.
// NOTE: expands to several statements (it is not wrapped in do/while), so it
// must not be used as the sole body of an unbraced `if`/`for`.
#define POD5_C_ASSIGN_OR_RAISE_IMPL(result_name, lhs, rexpr) \
    auto && result_name = (rexpr);                           \
    if (!(result_name).ok()) {                               \
        pod5_set_error((result_name).status());              \
        return g_pod5_error_no;                              \
    }                                                        \
    lhs = std::move(result_name).ValueUnsafe();

// Evaluate `rexpr` (a Result). On failure record the error and return the error
// code from the enclosing function; on success move the value into `lhs`, which
// may be a declaration (`auto x`) or an existing lvalue (`*out`).
#define POD5_C_ASSIGN_OR_RAISE(lhs, rexpr) \
    POD5_C_ASSIGN_OR_RAISE_IMPL(           \
        ARROW_ASSIGN_OR_RAISE_NAME(_error_or_value, __COUNTER__), lhs, rexpr);

//---------------------------------------------------------------------------------------------------------------------
// Validate a C string argument.
// Returns true when `str` is non-null and has at least one character;
// otherwise records an Invalid error for the calling thread and returns false.
bool check_string_not_empty(char const * str)
{
    if (!str) {
        pod5_set_error(arrow::Status::Invalid("null string passed to C API"));
        return false;
    }

    // Only the first character is needed to decide emptiness: no need to walk
    // the whole string, and no dependency on <cstring>.
    if (str[0] == '\0') {
        pod5_set_error(arrow::Status::Invalid("empty string passed to C API"));
        return false;
    }

    return true;
}

// Validate a generic pointer argument.
// Returns true for a non-null pointer; otherwise records an Invalid error and
// returns false.
bool check_not_null(void const * ptr)
{
    if (ptr) {
        return true;
    }

    pod5_set_error(arrow::Status::Invalid("null passed to C API"));
    return false;
}

// Validate a file handle argument.
// Returns true for a non-null handle; otherwise records an Invalid error and
// returns false.
bool check_file_not_null(void const * file)
{
    if (file) {
        return true;
    }

    pod5_set_error(arrow::Status::Invalid("null file passed to C API"));
    return false;
}

// Validate an output parameter.
// Returns true for a non-null pointer; otherwise records an Invalid error and
// returns false.
bool check_output_pointer_not_null(void const * output)
{
    if (output) {
        return true;
    }

    pod5_set_error(arrow::Status::Invalid("null output parameter passed to C API"));
    return false;
}

//---------------------------------------------------------------------------------------------------------------------
// Translate the C writer options into the internal FileWriterOptions.
// A null `options` pointer, or a zero value for any size field, leaves the
// corresponding internal default untouched. The signal type is only changed
// when uncompressed signal is requested.
pod5::FileWriterOptions make_internal_writer_options(Pod5WriterOptions const * options)
{
    pod5::FileWriterOptions internal_options;

    // No options supplied: use the defaults as they are.
    if (!options) {
        return internal_options;
    }

    if (options->max_signal_chunk_size != 0) {
        internal_options.set_max_signal_chunk_size(options->max_signal_chunk_size);
    }

    if (options->signal_compression_type == UNCOMPRESSED_SIGNAL) {
        internal_options.set_signal_type(pod5::SignalType::UncompressedSignal);
    }

    if (options->signal_table_batch_size != 0) {
        internal_options.set_signal_table_batch_size(options->signal_table_batch_size);
    }

    if (options->read_table_batch_size != 0) {
        internal_options.set_read_table_batch_size(options->read_table_batch_size);
    }

    return internal_options;
}

// Translate the C reader options into the internal FileReaderOptions.
// Only force_disable_file_mapping is carried across; everything else keeps the
// internal default.
pod5::FileReaderOptions make_internal_reader_options(Pod5ReaderOptions const & options)
{
    pod5::FileReaderOptions internal_options;
    internal_options.set_force_disable_file_mapping(options.force_disable_file_mapping);
    return internal_options;
}

}  // namespace

extern "C" {

//---------------------------------------------------------------------------------------------------------------------
// Initialise the library by registering the pod5 extension types.
// Returns POD5_OK on success, otherwise the recorded error code.
pod5_error_t pod5_init()
{
    pod5_reset_error();
    POD5_C_RETURN_NOT_OK(pod5::register_extension_types());
    return POD5_OK;
}

// Shut the library down by unregistering the pod5 extension types.
// Returns POD5_OK on success, otherwise the recorded error code.
pod5_error_t pod5_terminate()
{
    pod5_reset_error();
    POD5_C_RETURN_NOT_OK(pod5::unregister_extension_types());
    return POD5_OK;
}

// Error code recorded by the most recent C API call on the calling thread.
pod5_error_t pod5_get_error_no() { return g_pod5_error_no; }

// Error message recorded by the most recent C API call on the calling thread.
// The pointer refers to the thread-local string's buffer, so it is only valid
// until the next call on this thread that sets or resets the error.
char const * pod5_get_error_string() { return g_pod5_error_string.c_str(); }

//---------------------------------------------------------------------------------------------------------------------
// Open `filename` for reading with value-initialised (all zero) reader options.
// Returns nullptr on failure; see pod5_open_file_options.
Pod5FileReader * pod5_open_file(char const * filename)
{
    Pod5ReaderOptions_t options{};
    return pod5_open_file_options(filename, &options);
}

// Open `filename` for reading using the supplied options.
// Returns a heap-allocated reader handle, to be freed with
// pod5_close_and_free_reader. Returns nullptr - with the thread's error state
// set - when an argument is invalid or the file cannot be opened.
Pod5FileReader * pod5_open_file_options(char const * filename, Pod5ReaderOptions_t const * options)
{
    pod5_reset_error();

    // Validate arguments in order; the first failing check sets the error.
    if (!check_string_not_empty(filename)) {
        return nullptr;
    }
    if (!check_not_null(options)) {
        return nullptr;
    }

    auto open_result = pod5::open_file_reader(filename, make_internal_reader_options(*options));
    if (!open_result.ok()) {
        pod5_set_error(open_result.status());
        return nullptr;
    }

    // Ownership of the wrapper passes to the caller.
    return std::make_unique<Pod5FileReader>(std::move(*open_result)).release();
}

// Destroy a reader handle obtained from pod5_open_file / pod5_open_file_options.
// A null `file` is accepted and does nothing. Always returns POD5_OK.
pod5_error_t pod5_close_and_free_reader(Pod5FileReader * file)
{
    pod5_reset_error();

    // Adopt the raw pointer so it is deleted through unique_ptr.
    std::unique_ptr<Pod5FileReader> ptr{file};
    ptr.reset();
    return POD5_OK;
}

// Fill `file_info` with the file identifier and the pod5 version that wrote the
// file, both taken from the reader's schema metadata.
// Returns the recorded error code when `reader` or `file_info` is null.
pod5_error_t pod5_get_file_info(Pod5FileReader_t const * reader, FileInfo * file_info)
{
    pod5_reset_error();

    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(file_info)) {
        return g_pod5_error_no;
    }

    auto const metadata = reader->reader->schema_metadata();
    metadata.file_identifier.to_c_array(file_info->file_identifier);

    auto const & written_by = metadata.writing_pod5_version;
    file_info->version.major = written_by.major_version();
    file_info->version.minor = written_by.minor_version();
    file_info->version.revision = written_by.revision_version();

    return POD5_OK;
}

// Report where the read table is stored: file path, byte offset and length.
// NOTE(review): file_name points at the string held by the location object
// returned by the reader - presumably valid only while the reader is alive; confirm.
pod5_error_t pod5_get_file_read_table_location(
    Pod5FileReader_t const * reader,
    EmbeddedFileData_t * file_data)
{
    pod5_reset_error();

    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(file_data)) {
        return g_pod5_error_no;
    }

    auto const & location = reader->reader->read_table_location();
    file_data->length = location.size;
    file_data->offset = location.offset;
    file_data->file_name = location.file_path.c_str();
    return POD5_OK;
}

// Report where the signal table is stored: file path, byte offset and length.
// NOTE(review): file_name points at the string held by the location object
// returned by the reader - presumably valid only while the reader is alive; confirm.
pod5_error_t pod5_get_file_signal_table_location(
    Pod5FileReader_t const * reader,
    EmbeddedFileData_t * file_data)
{
    pod5_reset_error();

    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(file_data)) {
        return g_pod5_error_no;
    }

    auto const & location = reader->reader->signal_table_location();
    file_data->length = location.size;
    file_data->offset = location.offset;
    file_data->file_name = location.file_path.c_str();
    return POD5_OK;
}

// Report where the run info table is stored: file path, byte offset and length.
// NOTE(review): file_name points at the string held by the location object
// returned by the reader - presumably valid only while the reader is alive; confirm.
pod5_error_t pod5_get_file_run_info_table_location(
    Pod5FileReader_t const * reader,
    EmbeddedFileData_t * file_data)
{
    pod5_reset_error();

    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(file_data)) {
        return g_pod5_error_no;
    }

    auto const & location = reader->reader->run_info_table_location();
    file_data->length = location.size;
    file_data->offset = location.offset;
    file_data->file_name = location.file_path.c_str();
    return POD5_OK;
}

// Write the reader's read count to `*count`.
// Returns the recorded error code when an argument is null or the reader fails
// to produce the count; `*count` is not written in that case.
pod5_error_t pod5_get_read_count(Pod5FileReader_t const * reader, size_t * count)
{
    pod5_reset_error();

    if (!check_file_not_null(reader) || !check_output_pointer_not_null(count)) {
        return g_pod5_error_no;
    }

    // Assigns straight into the output parameter on success.
    POD5_C_ASSIGN_OR_RAISE(*count, reader->reader->read_count());

    return POD5_OK;
}

// Copy the read id of every read in the file into `read_ids`, batch after
// batch, in the order the batches are stored.
//
// `count` is the capacity of `read_ids` in elements and must be at least the
// file's read count, otherwise an Invalid error is recorded and nothing is
// written. Returns POD5_OK on success, or the recorded error code when an
// argument is null, the buffer is too small, or a batch cannot be read (in
// which case ids from earlier batches may already have been written).
pod5_error_t pod5_get_read_ids(Pod5FileReader_t const * reader, size_t count, read_id_t * read_ids)
{
    pod5_reset_error();

    if (!check_file_not_null(reader) || !check_output_pointer_not_null(read_ids)) {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(auto read_count, reader->reader->read_count());
    if (count < read_count) {
        pod5_set_error(arrow::Status::Invalid("array too short to receive read ids"));
        return g_pod5_error_no;
    }

    // The batch count does not change while we iterate, so query it once.
    std::size_t const batch_count = reader->reader->num_read_record_batches();

    std::size_t count_so_far = 0;
    for (std::size_t i = 0; i < batch_count; ++i) {
        POD5_C_ASSIGN_OR_RAISE(auto const batch, reader->reader->read_read_record_batch(i));

        // Copy the column's id storage as raw bytes directly after the ids
        // written for the previous batches.
        auto const read_id_column = batch.read_id_column();
        auto raw_data = reinterpret_cast<uint8_t const *>(read_id_column->raw_values());
        std::copy(
            raw_data,
            raw_data + (read_id_column->length() * sizeof(read_id_t)),
            reinterpret_cast<uint8_t *>(read_ids + count_so_far));
        count_so_far += read_id_column->length();
    }

    return POD5_OK;
}

// Search the file for the given read ids and describe where they were found.
//
// `read_id_array` is reinterpreted as `read_id_count` pod5::Uuid values.
// `batch_counts` is treated as having one entry per read table batch and
// `batch_rows` one entry per requested read id. The value produced by the
// search is written to `*find_success_count_out`.
// Returns the recorded error code when any pointer is null or the search fails.
pod5_error_t pod5_plan_traversal(
    Pod5FileReader_t const * reader,
    uint8_t const * read_id_array,
    size_t read_id_count,
    uint32_t * batch_counts,
    uint32_t * batch_rows,
    size_t * find_success_count_out)
{
    pod5_reset_error();

    // Checks run in order and stop at the first failure, which sets the error.
    bool const arguments_ok = check_file_not_null(reader) && check_not_null(read_id_array)
                              && check_output_pointer_not_null(batch_counts)
                              && check_output_pointer_not_null(batch_rows)
                              && check_output_pointer_not_null(find_success_count_out);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    auto const * uuids = reinterpret_cast<pod5::Uuid const *>(read_id_array);
    auto search_input = pod5::ReadIdSearchInput(gsl::make_span(uuids, read_id_count));

    POD5_C_ASSIGN_OR_RAISE(
        auto found_count,
        reader->reader->search_for_read_ids(
            search_input,
            gsl::make_span(batch_counts, reader->reader->num_read_record_batches()),
            gsl::make_span(batch_rows, read_id_count)));

    // TODO: on MAJOR_VERSION bump drop this out param and do the check internally.
    *find_success_count_out = found_count;

    return POD5_OK;
}

// Write the number of read table batches in the file to `*count`.
// Returns the recorded error code when `reader` or `count` is null.
pod5_error_t pod5_get_read_batch_count(size_t * count, Pod5FileReader const * reader)
{
    pod5_reset_error();

    bool const arguments_ok = check_file_not_null(reader) && check_output_pointer_not_null(count);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    *count = reader->reader->num_read_record_batches();
    return POD5_OK;
}

// Load read table batch `index` and return it through `*batch` as a
// heap-allocated handle, to be freed with pod5_free_read_batch. The handle
// keeps its own reference to the reader.
// Returns the recorded error code when an argument is null or the batch cannot
// be read; `*batch` is not written in that case.
pod5_error_t
pod5_get_read_batch(Pod5ReadRecordBatch ** batch, Pod5FileReader const * reader, size_t index)
{
    pod5_reset_error();

    bool const arguments_ok = check_file_not_null(reader) && check_output_pointer_not_null(batch);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(auto loaded_batch, reader->reader->read_read_record_batch(index));

    // Ownership of the wrapper passes to the caller.
    *batch =
        std::make_unique<Pod5ReadRecordBatch>(std::move(loaded_batch), reader->reader).release();
    return POD5_OK;
}

// Destroy a batch handle obtained from pod5_get_read_batch.
// A null `batch` is accepted and does nothing. Always returns POD5_OK.
pod5_error_t pod5_free_read_batch(Pod5ReadRecordBatch * batch)
{
    pod5_reset_error();

    // Adopt the raw pointer so it is deleted through unique_ptr.
    std::unique_ptr<Pod5ReadRecordBatch> ptr{batch};
    ptr.reset();
    return POD5_OK;
}

// Write the number of rows in `batch` to `*count`.
// Returns the recorded error code when `batch` or `count` is null.
pod5_error_t pod5_get_read_batch_row_count(size_t * count, Pod5ReadRecordBatch const * batch)
{
    pod5_reset_error();

    bool const arguments_ok = check_not_null(batch) && check_output_pointer_not_null(count);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    *count = batch->batch.num_rows();
    return POD5_OK;
}

// Check that `row` is a valid index into a batch of `batch_size` rows.
// Returns POD5_OK when it is; otherwise records an IndexError and returns the
// recorded error code. Rows too large to represent as int64_t are rejected
// before the signed comparison is made.
static pod5_error_t check_row_index_and_set_error(size_t row, int64_t batch_size)
{
    bool const representable =
        row <= static_cast<size_t>(std::numeric_limits<int64_t>::max());
    if (representable && static_cast<int64_t>(row) < batch_size) {
        return POD5_OK;
    }

    pod5_set_error(
        arrow::Status::IndexError(
            "Invalid index into batch. Index ", row, " with batch size ", batch_size));
    return g_pod5_error_no;
}

// Fill a caller-provided row info struct with the fields of one read.
//
// `struct_version` selects the layout `row_data` points at: it is cast to
// ReadBatchRowInfoV3 for READ_BATCH_ROW_INFO_VERSION_3 and ReadBatchRowInfoV4
// for READ_BATCH_ROW_INFO_VERSION_4; any other value is rejected with an
// Invalid error. `*read_table_version` receives the version of the batch's
// read table, and is written before the row index is validated.
// Returns the recorded error code for null arguments, an out-of-range row, an
// unknown struct version, or a failure to obtain the batch columns.
pod5_error_t pod5_get_read_batch_row_info_data(
    Pod5ReadRecordBatch_t const * batch,
    size_t row,
    uint16_t struct_version,
    void * row_data,
    uint16_t * read_table_version)
{
    pod5_reset_error();

    if (!check_not_null(batch) || !check_output_pointer_not_null(row_data)
        || !check_output_pointer_not_null(read_table_version))
    {
        return g_pod5_error_no;
    }

    // Forces this function to be revisited whenever a new struct version is added.
    static_assert(
        READ_BATCH_ROW_INFO_VERSION == READ_BATCH_ROW_INFO_VERSION_4,
        "New versions must be explicitly loaded");

    // Copies every field shared by the V3 and V4 structs. Generic over the
    // struct type so the same code serves both layouts.
    auto load_common_v3_v4_fields = [](pod5::ReadTableRecordColumns const & cols,
                                       std::size_t row,
                                       auto * typed_row_data) {
        // Reject out-of-range rows before any column is indexed.

        if (check_row_index_and_set_error(row, cols.read_id->length()) != POD5_OK) {
            return g_pod5_error_no;
        }

        auto read_id_val = cols.read_id->Value(row);
        read_id_val.to_c_array(typed_row_data->read_id);

        typed_row_data->read_number = cols.read_number->Value(row);
        typed_row_data->start_sample = cols.start_sample->Value(row);
        typed_row_data->median_before = cols.median_before->Value(row);
        typed_row_data->channel = cols.channel->Value(row);
        typed_row_data->well = cols.well->Value(row);
        // Dictionary columns: report the dictionary index, not the decoded value.
        auto const & pore_type_col = cols.pore_type->indices();
        typed_row_data->pore_type =
            static_cast<arrow::Int16Array const &>(*pore_type_col).Value(row);
        typed_row_data->calibration_offset = cols.calibration_offset->Value(row);
        typed_row_data->calibration_scale = cols.calibration_scale->Value(row);
        auto const & end_reason_col = cols.end_reason->indices();
        typed_row_data->end_reason =
            static_cast<arrow::Int16Array const &>(*end_reason_col).Value(row);
        typed_row_data->end_reason_forced = cols.end_reason_forced->Value(row);
        auto const & run_info_col = cols.run_info->indices();
        typed_row_data->run_info = static_cast<arrow::Int16Array const &>(*run_info_col).Value(row);
        typed_row_data->num_minknow_events = cols.num_minknow_events->Value(row);
        typed_row_data->tracked_scaling_scale = cols.tracked_scaling_scale->Value(row);
        typed_row_data->tracked_scaling_shift = cols.tracked_scaling_shift->Value(row);
        typed_row_data->predicted_scaling_scale = cols.predicted_scaling_scale->Value(row);
        typed_row_data->predicted_scaling_shift = cols.predicted_scaling_shift->Value(row);
        typed_row_data->num_reads_since_mux_change = cols.num_reads_since_mux_change->Value(row);
        typed_row_data->time_since_mux_change = cols.time_since_mux_change->Value(row);

        // Number of signal table rows referenced by this read.
        typed_row_data->signal_row_count = cols.signal->value_length(row);
        typed_row_data->num_samples = cols.num_samples->Value(row);
        return POD5_OK;
    };

    if (struct_version == READ_BATCH_ROW_INFO_VERSION_3) {
        auto typed_row_data = static_cast<ReadBatchRowInfoV3 *>(row_data);

        POD5_C_ASSIGN_OR_RAISE(auto cols, batch->batch.columns());
        // Inform the caller of the version of the input table.
        *read_table_version = cols.table_version.as_int();

        auto result = load_common_v3_v4_fields(cols, row, typed_row_data);
        if (result != POD5_OK) {
            return result;
        }
    } else if (struct_version == READ_BATCH_ROW_INFO_VERSION_4) {
        auto typed_row_data = static_cast<ReadBatchRowInfoV4 *>(row_data);

        POD5_C_ASSIGN_OR_RAISE(auto cols, batch->batch.columns());
        // Inform the caller of the version of the input table.
        *read_table_version = cols.table_version.as_int();

        auto result = load_common_v3_v4_fields(cols, row, typed_row_data);
        if (result != POD5_OK) {
            return result;
        }

        // This is the only difference between v3 and v4.
        typed_row_data->open_pore_level = cols.open_pore_level->Value(row);
    } else {
        pod5_set_error(
            arrow::Status::Invalid("Invalid struct version '", struct_version, "' passed"));
        return g_pod5_error_no;
    }

    return POD5_OK;
}

// Copy the signal table row indices of read `row` into `signal_row_indices`.
//
// `signal_row_indices_count` must equal the number of signal rows the read
// has, otherwise an Invalid error is recorded and nothing is written.
// Returns the recorded error code for null arguments, an out-of-range row, or
// a count mismatch.
pod5_error_t pod5_get_signal_row_indices(
    Pod5ReadRecordBatch const * batch,
    size_t row,
    int64_t signal_row_indices_count,
    uint64_t * signal_row_indices)
{
    pod5_reset_error();

    bool const arguments_ok =
        check_not_null(batch) && check_output_pointer_not_null(signal_row_indices);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    auto const signal_col = batch->batch.signal_column();
    if (check_row_index_and_set_error(row, signal_col->length()) != POD5_OK) {
        return g_pod5_error_no;
    }

    // The list entry for this read: one signal table row index per element.
    auto const read_signal_rows =
        std::static_pointer_cast<arrow::UInt64Array>(signal_col->value_slice(row));

    if (signal_row_indices_count != read_signal_rows->length()) {
        pod5_set_error(
            pod5::Status::Invalid(
                "Incorrect number of signal indices, expected ",
                read_signal_rows->length(),
                " received ",
                signal_row_indices_count));
        return g_pod5_error_no;
    }

    std::int64_t index = 0;
    while (index < signal_row_indices_count) {
        signal_row_indices[index] = read_signal_rows->Value(index);
        ++index;
    }

    return POD5_OK;
}

// Compute the extra calibration values for read `row`:
//   digitisation = adc_max - adc_min + 1   (from the read's run info)
//   range        = calibration_scale * digitisation
// Returns the recorded error code for null arguments, an out-of-range row, or
// when the columns or the run info cannot be obtained.
pod5_error_t pod5_get_calibration_extra_info(
    Pod5ReadRecordBatch_t const * batch,
    size_t row,
    CalibrationExtraData_t * calibration_extra_data)
{
    pod5_reset_error();

    bool const arguments_ok =
        check_not_null(batch) && check_output_pointer_not_null(calibration_extra_data);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(auto columns, batch->batch.columns());

    if (check_row_index_and_set_error(row, columns.calibration_scale->length()) != POD5_OK) {
        return g_pod5_error_no;
    }

    // Resolve the read's run info: dictionary index -> acquisition id -> run info record.
    auto const & run_info_indices = columns.run_info->indices();
    auto const dictionary_index =
        static_cast<arrow::Int16Array const &>(*run_info_indices).Value(row);

    POD5_C_ASSIGN_OR_RAISE(auto const acquisition_id, batch->batch.get_run_info(dictionary_index));
    POD5_C_ASSIGN_OR_RAISE(auto run_info, batch->reader->find_run_info(acquisition_id));

    auto const calibration_scale = columns.calibration_scale->Value(row);

    // range is derived from the stored digitisation field, so it reflects any
    // conversion applied when that field was assigned.
    calibration_extra_data->digitisation = run_info->adc_max - run_info->adc_min + 1;
    calibration_extra_data->range = calibration_scale * calibration_extra_data->digitisation;

    return POD5_OK;
}

namespace {

struct RunInfoDataCHelper : public RunInfoDictData {
    struct InternalMapHelper {
        std::vector<char const *> keys;
        std::vector<char const *> values;
    };

    RunInfoDataCHelper(std::shared_ptr<pod5::RunInfoData const> && internal_data_)
    : internal_data(std::move(internal_data_))
    {
        acquisition_id = internal_data->acquisition_id.c_str();
        acquisition_start_time_ms = internal_data->acquisition_start_time;
        adc_max = internal_data->adc_max;
        adc_min = internal_data->adc_min;
        context_tags = map_to_c(internal_data->context_tags, context_tags_helper);
        experiment_name = internal_data->experiment_name.c_str();
        flow_cell_id = internal_data->flow_cell_id.c_str();
        flow_cell_product_code = internal_data->flow_cell_product_code.c_str();
        protocol_name = internal_data->protocol_name.c_str();
        protocol_run_id = internal_data->protocol_run_id.c_str();
        protocol_start_time_ms = internal_data->protocol_start_time;
        sample_id = internal_data->sample_id.c_str();
        sample_rate = internal_data->sample_rate;
        sequencing_kit = internal_data->sequencing_kit.c_str();
        sequencer_position = internal_data->sequencer_position.c_str();
        sequencer_position_type = internal_data->sequencer_position_type.c_str();
        software = internal_data->software.c_str();
        system_name = internal_data->system_name.c_str();
        system_type = internal_data->system_type.c_str();
        tracking_id = map_to_c(internal_data->tracking_id, tracking_id_helper);
    }

    KeyValueData map_to_c(pod5::RunInfoData::MapType const & map, InternalMapHelper & helper)
    {
        helper.keys.reserve(map.size());
        helper.values.reserve(map.size());
        for (auto const & item : map) {
            helper.keys.push_back(item.first.c_str());
            helper.values.push_back(item.second.c_str());
        }

        KeyValueData result;
        result.size = helper.keys.size();
        result.keys = helper.keys.data();
        result.values = helper.values.data();
        return result;
    }

    std::shared_ptr<pod5::RunInfoData const> internal_data;
    InternalMapHelper context_tags_helper;
    InternalMapHelper tracking_id_helper;
};

}  // namespace

/// \brief Look up the run info for a dictionary index of a read batch.
///
/// \param batch          The read record batch whose run info dictionary is queried.
/// \param run_info       The run info dictionary index.
/// \param run_info_data  [out] Receives a newly allocated run info structure; this file
///                       destroys such structures in pod5_free_run_info.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_get_run_info(
    Pod5ReadRecordBatch const * batch,
    int16_t run_info,
    RunInfoDictData ** run_info_data)
{
    pod5_reset_error();

    if (!check_not_null(batch)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(run_info_data)) {
        return g_pod5_error_no;
    }

    // Dictionary index -> acquisition id -> run info held by the reader.
    POD5_C_ASSIGN_OR_RAISE(auto const acq_id, batch->batch.get_run_info(run_info));
    POD5_C_ASSIGN_OR_RAISE(auto found_run_info, batch->reader->find_run_info(acq_id));

    // Ownership of the helper passes to the caller.
    *run_info_data = std::make_unique<RunInfoDataCHelper>(std::move(found_run_info)).release();
    return POD5_OK;
}

/// \brief Fetch a run info from a file by its index.
///
/// \param file            The file reader to query.
/// \param run_info_index  Index of the run info within the file.
/// \param run_info_data   [out] Receives a newly allocated run info structure; this file
///                        destroys such structures in pod5_free_run_info.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_get_file_run_info(
    Pod5FileReader_t const * file,
    run_info_index_t run_info_index,
    RunInfoDictData_t ** run_info_data)
{
    pod5_reset_error();

    if (!check_file_not_null(file)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(run_info_data)) {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(auto found_run_info, file->reader->get_run_info(run_info_index));

    // Ownership of the helper passes to the caller.
    *run_info_data = std::make_unique<RunInfoDataCHelper>(std::move(found_run_info)).release();
    return POD5_OK;
}

/// \brief Destroy a run info structure produced by pod5_get_run_info or
///        pod5_get_file_run_info.
///
/// \param run_info_data  The structure to destroy; a null pointer is accepted and ignored.
/// \return Always POD5_OK.
pod5_error_t pod5_free_run_info(RunInfoDictData_t * run_info_data)
{
    pod5_reset_error();

    // Re-adopt the allocation as its concrete helper type; it is destroyed when
    // `owner` goes out of scope.
    std::unique_ptr<RunInfoDataCHelper> const owner{
        static_cast<RunInfoDataCHelper *>(run_info_data)};

    return POD5_OK;
}

/// \brief Alternative entry point for pod5_free_run_info.
///
/// Forwards directly to pod5_free_run_info and returns its result.
pod5_error_t pod5_release_run_info(RunInfoDictData * run_info_data)
{
    return pod5_free_run_info(run_info_data);
}

/// \brief Query how many run infos a file contains.
///
/// \param file            The file reader to query.
/// \param run_info_count  [out] Receives the number of run infos.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_get_file_run_info_count(
    Pod5FileReader_t const * file,
    run_info_index_t * run_info_count)
{
    pod5_reset_error();

    if (!check_file_not_null(file)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(run_info_count)) {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(*run_info_count, file->reader->get_run_info_count());

    return POD5_OK;
}

/// \brief Look up an end reason by its dictionary index within a read batch.
///
/// \param batch                         The read record batch to query.
/// \param end_reason                    The end reason dictionary index.
/// \param end_reason_value              [out] Receives the end reason as an enum value.
/// \param end_reason_string_value       [out] Buffer receiving the NUL-terminated end
///                                      reason string.
/// \param end_reason_string_value_size  [in,out] On entry the capacity of
///                                      \p end_reason_string_value in bytes. On exit
///                                      (success or POD5_ERROR_STRING_NOT_LONG_ENOUGH)
///                                      the number of bytes required, including the
///                                      terminator.
/// \return POD5_OK on success, POD5_ERROR_STRING_NOT_LONG_ENOUGH when the buffer cannot
///         hold the string plus its terminator, otherwise the error code recorded for
///         this call.
pod5_error_t pod5_get_end_reason(
    Pod5ReadRecordBatch_t const * batch,
    int16_t end_reason,
    pod5_end_reason * end_reason_value,
    char * end_reason_string_value,
    size_t * end_reason_string_value_size)
{
    pod5_reset_error();

    if (!check_not_null(batch) || !check_output_pointer_not_null(end_reason_value)
        || !check_output_pointer_not_null(end_reason_string_value)
        || !check_output_pointer_not_null(end_reason_string_value_size))
    {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(auto const end_reason_val, batch->batch.get_end_reason(end_reason));
    auto const & reason_string = end_reason_val.second;

    // Always report the required size so the caller can retry with a larger buffer.
    auto const input_buffer_len = *end_reason_string_value_size;
    *end_reason_string_value_size = reason_string.size() + 1;
    if (reason_string.size() >= input_buffer_len) {
        return POD5_ERROR_STRING_NOT_LONG_ENOUGH;
    }

    *end_reason_value = POD5_END_REASON_UNKNOWN;
    switch (end_reason_val.first) {
    case pod5::ReadEndReason::mux_change:
        *end_reason_value = POD5_END_REASON_MUX_CHANGE;
        break;
    case pod5::ReadEndReason::unblock_mux_change:
        *end_reason_value = POD5_END_REASON_UNBLOCK_MUX_CHANGE;
        break;
    case pod5::ReadEndReason::data_service_unblock_mux_change:
        *end_reason_value = POD5_END_REASON_DATA_SERVICE_UNBLOCK_MUX_CHANGE;
        break;
    case pod5::ReadEndReason::signal_positive:
        *end_reason_value = POD5_END_REASON_SIGNAL_POSITIVE;
        break;
    case pod5::ReadEndReason::signal_negative:
        *end_reason_value = POD5_END_REASON_SIGNAL_NEGATIVE;
        break;
    case pod5::ReadEndReason::api_request:
        *end_reason_value = POD5_END_REASON_API_REQUEST;
        break;
    case pod5::ReadEndReason::device_data_error:
        *end_reason_value = POD5_END_REASON_DEVICE_DATA_ERROR;
        break;
    case pod5::ReadEndReason::analysis_config_change:
        *end_reason_value = POD5_END_REASON_ANALYSIS_CONFIG_CHANGE;
        break;
    case pod5::ReadEndReason::paused:
        *end_reason_value = POD5_END_REASON_PAUSED;
        break;
    case pod5::ReadEndReason::unknown:
        *end_reason_value = POD5_END_REASON_UNKNOWN;
        break;
    }

    std::copy(reason_string.begin(), reason_string.end(), end_reason_string_value);
    // Terminate directly after the copied characters. The size output already
    // counts the terminator, so using it as the index would be one past the end.
    end_reason_string_value[reason_string.size()] = '\0';
    return POD5_OK;
}

/// \brief Look up a pore type string by its dictionary index within a read batch.
///
/// \param batch                        The read record batch to query.
/// \param pore_type                    The pore type dictionary index.
/// \param pore_type_string_value       [out] Buffer receiving the NUL-terminated pore
///                                     type string.
/// \param pore_type_string_value_size  [in,out] On entry the capacity of
///                                     \p pore_type_string_value in bytes. On exit
///                                     (success or POD5_ERROR_STRING_NOT_LONG_ENOUGH)
///                                     the number of bytes required, including the
///                                     terminator.
/// \return POD5_OK on success, POD5_ERROR_STRING_NOT_LONG_ENOUGH when the buffer cannot
///         hold the string plus its terminator, otherwise the error code recorded for
///         this call.
pod5_error_t pod5_get_pore_type(
    Pod5ReadRecordBatch_t const * batch,
    int16_t pore_type,
    char * pore_type_string_value,
    size_t * pore_type_string_value_size)
{
    pod5_reset_error();

    if (!check_not_null(batch) || !check_output_pointer_not_null(pore_type_string_value)
        || !check_output_pointer_not_null(pore_type_string_value_size))
    {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(auto const pore_type_str, batch->batch.get_pore_type(pore_type));

    // Always report the required size so the caller can retry with a larger buffer.
    auto const input_buffer_len = *pore_type_string_value_size;
    *pore_type_string_value_size = pore_type_str.size() + 1;
    if (pore_type_str.size() >= input_buffer_len) {
        return POD5_ERROR_STRING_NOT_LONG_ENOUGH;
    }

    std::copy(pore_type_str.begin(), pore_type_str.end(), pore_type_string_value);
    // Terminate directly after the copied characters. The size output already
    // counts the terminator, so using it as the index would be one past the end.
    pore_type_string_value[pore_type_str.size()] = '\0';
    return POD5_OK;
}

namespace {

// Concrete type behind the SignalRowInfo pointers handed out by
// pod5_get_signal_row_info. It stores the signal table record batch that
// pod5_get_signal later extracts samples from.
class SignalRowInfoCHelper : public SignalRowInfo {
public:
    // Takes ownership of the record batch by moving it into the helper.
    SignalRowInfoCHelper(pod5::SignalTableRecordBatch && b) : batch(std::move(b)) {}

    // The signal table batch associated with this row info.
    pod5::SignalTableRecordBatch const batch;
};

}  // namespace

/// \brief Find the location and stored sizes of a set of signal rows.
///
/// \param reader             The file reader to query.
/// \param signal_rows_count  Number of entries in \p signal_rows and \p signal_row_info.
/// \param signal_rows        The signal row ids to look up.
/// \param signal_row_info    [out] Receives one newly allocated SignalRowInfo per row;
///                           this file destroys them in pod5_free_signal_row_info.
/// \return POD5_OK on success, otherwise the error code recorded for this call. Nothing
///         is written to \p signal_row_info on failure.
///
/// \note The row ids are sorted before lookup, so the outputs are written in ascending
///       row-id order rather than in the order of \p signal_rows.
pod5_error_t pod5_get_signal_row_info(
    Pod5FileReader const * reader,
    size_t signal_rows_count,
    uint64_t const * signal_rows,
    SignalRowInfo ** signal_row_info)
{
    pod5_reset_error();

    // Check for a valid reader.
    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }

    // Check for valid inputs.
    if (signal_rows_count == 0) {
        // Nothing to do.
        return POD5_OK;
    } else if (!check_not_null(signal_rows) || !check_output_pointer_not_null(signal_row_info)) {
        return g_pod5_error_no;
    }

    // Sort all rows first, in order to make searching faster.
    std::vector<std::uint64_t> signal_rows_sorted{signal_rows, signal_rows + signal_rows_count};
    std::sort(signal_rows_sorted.begin(), signal_rows_sorted.end());

    // Store allocations to a temporary buffer so that we don't leak them on failure.
    std::vector<std::unique_ptr<SignalRowInfoCHelper>> row_infos(signal_rows_count);

    // Then loop all rows, forward.
    for (std::size_t completed_rows = 0; completed_rows < signal_rows_sorted.size();
         completed_rows++)
    {
        auto const start_row = signal_rows_sorted[completed_rows];

        // Resolve the global row id into (batch index, row within that batch).
        std::size_t batch_row = 0;
        POD5_C_ASSIGN_OR_RAISE(
            std::size_t row_batch,
            (reader->reader->signal_batch_for_row_id(start_row, &batch_row)));
        POD5_C_ASSIGN_OR_RAISE(auto batch, reader->reader->read_signal_record_batch(row_batch));

        auto output = std::make_unique<SignalRowInfoCHelper>(std::move(batch));

        // Report the index of the batch holding the row, not the global row id.
        output->batch_index = row_batch;
        output->batch_row_index = batch_row;

        auto samples = output->batch.samples_column();
        output->stored_sample_count = samples->Value(batch_row);
        POD5_C_ASSIGN_OR_RAISE(
            output->stored_byte_count, output->batch.samples_byte_count(batch_row));

        row_infos[completed_rows] = std::move(output);
    }

    // Pass ownership of the info back to the caller.
    for (std::size_t row_idx = 0; row_idx < signal_rows_count; row_idx++) {
        signal_row_info[row_idx] = row_infos[row_idx].release();
    }
    return POD5_OK;
}

/// \brief Destroy the signal row infos produced by pod5_get_signal_row_info.
///
/// \param signal_rows_count  Number of entries in \p signal_row_info.
/// \param signal_row_info    The row infos to destroy; null entries are ignored.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_free_signal_row_info(size_t signal_rows_count, SignalRowInfo_t ** signal_row_info)
{
    pod5_reset_error();

    // The array pointer is only required when there is something to free.
    if (signal_rows_count > 0 && !check_not_null(signal_row_info)) {
        return g_pod5_error_no;
    }

    for (std::size_t idx = 0; idx != signal_rows_count; ++idx) {
        // Re-adopt each allocation as its concrete helper type; it is destroyed
        // at the end of the iteration.
        std::unique_ptr<SignalRowInfoCHelper> const owner{
            static_cast<SignalRowInfoCHelper *>(signal_row_info[idx])};
    }
    return POD5_OK;
}

/// \brief Extract the samples of one signal row into a caller supplied buffer.
///
/// \param reader        The file reader the row info belongs to (validated only).
/// \param row_info      A row info produced by pod5_get_signal_row_info.
/// \param sample_count  Number of samples \p sample_data can hold.
/// \param sample_data   [out] Receives the extracted samples.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_get_signal(
    Pod5FileReader const * reader,
    SignalRowInfo_t const * row_info,
    size_t sample_count,
    int16_t * sample_data)
{
    pod5_reset_error();

    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }
    if (!check_not_null(row_info)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(sample_data)) {
        return g_pod5_error_no;
    }

    // The row info carries the signal batch it was created from.
    auto const & helper = *static_cast<SignalRowInfoCHelper const *>(row_info);

    POD5_C_RETURN_NOT_OK(helper.batch.extract_signal_row(
        row_info->batch_row_index, gsl::make_span(sample_data, sample_count)));

    return POD5_OK;
}

/// \brief Compute the sample count across all signal rows of one read.
///
/// \param reader        The file reader used to inspect the signal rows.
/// \param batch         The read record batch containing the read.
/// \param batch_row     The row of the read within \p batch.
/// \param sample_count  [out] Receives the sample count.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_get_read_complete_sample_count(
    Pod5FileReader_t const * reader,
    Pod5ReadRecordBatch_t const * batch,
    size_t batch_row,
    size_t * sample_count)
{
    pod5_reset_error();

    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }
    if (!check_not_null(batch)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(sample_count)) {
        return g_pod5_error_no;
    }

    // Fetch the signal row ids for the read, then let the reader count them.
    POD5_C_ASSIGN_OR_RAISE(auto const & read_signal_rows, batch->batch.get_signal_rows(batch_row));

    POD5_C_ASSIGN_OR_RAISE(
        *sample_count,
        reader->reader->extract_sample_count(
            gsl::make_span(read_signal_rows->raw_values(), read_signal_rows->length())));
    return POD5_OK;
}

/// \brief Extract the samples from all signal rows of one read into a caller buffer.
///
/// \param reader        The file reader used to extract the samples.
/// \param batch         The read record batch containing the read.
/// \param batch_row     The row of the read within \p batch.
/// \param sample_count  Number of samples \p signal can hold.
/// \param signal        [out] Receives the samples.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_get_read_complete_signal(
    Pod5FileReader_t const * reader,
    Pod5ReadRecordBatch_t const * batch,
    size_t batch_row,
    size_t sample_count,
    int16_t * signal)
{
    pod5_reset_error();

    if (!check_file_not_null(reader)) {
        return g_pod5_error_no;
    }
    if (!check_not_null(batch)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(signal)) {
        return g_pod5_error_no;
    }

    // Fetch the signal row ids for the read, then extract them into `signal`.
    POD5_C_ASSIGN_OR_RAISE(auto const & read_signal_rows, batch->batch.get_signal_rows(batch_row));

    POD5_C_RETURN_NOT_OK(reader->reader->extract_samples(
        gsl::make_span(read_signal_rows->raw_values(), read_signal_rows->length()),
        gsl::make_span(signal, sample_count)));
    return POD5_OK;
}

//---------------------------------------------------------------------------------------------------------------------
/// \brief Create a new file writer.
///
/// \param filename     Path of the file to create; must be a non-empty string.
/// \param writer_name  Name of the writing software; must be a non-empty string.
/// \param options      Writer options, converted by make_internal_writer_options.
/// \return A newly allocated writer, or nullptr after recording an error. This file
///         destroys writers in pod5_close_and_free_writer.
Pod5FileWriter *
pod5_create_file(char const * filename, char const * writer_name, Pod5WriterOptions const * options)
{
    pod5_reset_error();

    if (!check_string_not_empty(filename)) {
        return nullptr;
    }
    if (!check_string_not_empty(writer_name)) {
        return nullptr;
    }

    auto creation =
        pod5::create_file_writer(filename, writer_name, make_internal_writer_options(options));
    if (creation.ok()) {
        // Wrap the internal writer and hand ownership to the caller.
        return std::make_unique<Pod5FileWriter>(std::move(*creation)).release();
    }

    pod5_set_error(creation.status());
    return nullptr;
}

/// \brief Close a writer and release its memory.
///
/// The writer object is destroyed even when closing it reports an error.
///
/// \param file  The writer to close; a null pointer is accepted and ignored.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_close_and_free_writer(Pod5FileWriter * file)
{
    pod5_reset_error();

    // Adopt the writer so it is destroyed on every exit path.
    std::unique_ptr<Pod5FileWriter> const owned_writer{file};
    if (owned_writer == nullptr) {
        return POD5_OK;
    }

    POD5_C_RETURN_NOT_OK(owned_writer->writer->close());
    return POD5_OK;
}

/// \brief Register a pore type with a writer.
///
/// \param pore_index  [out] Receives the index assigned to the pore type.
/// \param file        The writer to add the pore type to.
/// \param pore_type   The pore type name; must be a non-empty string.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_add_pore(int16_t * pore_index, Pod5FileWriter * file, char const * pore_type)
{
    pod5_reset_error();

    // Checked in this order: pore type string, writer handle, output pointer.
    bool const arguments_ok = check_string_not_empty(pore_type) && check_file_not_null(file)
                              && check_output_pointer_not_null(pore_index);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(*pore_index, file->writer->add_pore_type(pore_type));
    return POD5_OK;
}

/// \brief Register a run info with a writer.
///
/// Every string argument must be non-empty. Both key/value array pairs must be
/// non-null, and each of their first `*_count` entries must be a non-empty string.
///
/// \param run_info_index  [out] Receives the index assigned to the run info.
/// \param file            The writer to add the run info to.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_add_run_info(
    int16_t * run_info_index,
    Pod5FileWriter * file,
    char const * acquisition_id,
    int64_t acquisition_start_time_ms,
    int16_t adc_max,
    int16_t adc_min,
    size_t context_tags_count,
    char const ** context_tags_keys,
    char const ** context_tags_values,
    char const * experiment_name,
    char const * flow_cell_id,
    char const * flow_cell_product_code,
    char const * protocol_name,
    char const * protocol_run_id,
    int64_t protocol_start_time_ms,
    char const * sample_id,
    uint16_t sample_rate,
    char const * sequencing_kit,
    char const * sequencer_position,
    char const * sequencer_position_type,
    char const * software,
    char const * system_name,
    char const * system_type,
    size_t tracking_id_count,
    char const ** tracking_id_keys,
    char const ** tracking_id_values)
{
    pod5_reset_error();

    // Checks run in this order and stop at the first failure.
    bool const arguments_ok =
        check_file_not_null(file) && check_not_null(run_info_index)
        && check_string_not_empty(acquisition_id) && check_string_not_empty(experiment_name)
        && check_string_not_empty(flow_cell_id) && check_string_not_empty(flow_cell_product_code)
        && check_string_not_empty(protocol_name) && check_string_not_empty(protocol_run_id)
        && check_string_not_empty(sample_id) && check_string_not_empty(sequencing_kit)
        && check_string_not_empty(sequencer_position)
        && check_string_not_empty(sequencer_position_type) && check_string_not_empty(software)
        && check_string_not_empty(system_name) && check_string_not_empty(system_type);
    if (!arguments_ok) {
        return g_pod5_error_no;
    }

    // Converts parallel key/value C string arrays into the internal map type.
    auto const build_map =
        [](std::size_t entry_count,
           char const ** keys,
           char const ** values) -> pod5::Result<pod5::RunInfoData::MapType> {
        if (!check_not_null(keys) || !check_not_null(values)) {
            return arrow::Status::Invalid(g_pod5_error_string);
        }

        pod5::RunInfoData::MapType entries;
        for (std::size_t idx = 0; idx < entry_count; ++idx) {
            char const * const key = keys[idx];
            char const * const value = values[idx];
            if (!check_string_not_empty(key) || !check_string_not_empty(value)) {
                return arrow::Status::Invalid(g_pod5_error_string);
            }

            entries.emplace_back(key, value);
        }
        return entries;
    };

    POD5_C_ASSIGN_OR_RAISE(
        auto const context_tags,
        build_map(context_tags_count, context_tags_keys, context_tags_values));
    POD5_C_ASSIGN_OR_RAISE(
        auto const tracking_id, build_map(tracking_id_count, tracking_id_keys, tracking_id_values));

    POD5_C_ASSIGN_OR_RAISE(
        *run_info_index,
        file->writer->add_run_info(
            pod5::RunInfoData(
                acquisition_id,
                acquisition_start_time_ms,
                adc_max,
                adc_min,
                context_tags,
                experiment_name,
                flow_cell_id,
                flow_cell_product_code,
                protocol_name,
                protocol_run_id,
                protocol_start_time_ms,
                sample_id,
                sample_rate,
                sequencing_kit,
                sequencer_position,
                sequencer_position_type,
                software,
                system_name,
                system_type,
                tracking_id)));

    return POD5_OK;
}

// Validate the row data structure passed to the add-reads entry points.
//
// Returns false after recording an error when `row_data` is null, when
// `struct_version` is older than V3, or when any column pointer required by a
// V3/V4 structure is null. Versions other than V3 and V4 are not inspected here.
static bool check_read_data_struct(std::uint16_t struct_version, void const * row_data)
{
    static_assert(
        READ_BATCH_ROW_INFO_VERSION == READ_BATCH_ROW_INFO_VERSION_4,
        "New versions must be explicitly loaded");

    if (!check_not_null(row_data)) {
        return false;
    }

    if (struct_version < READ_BATCH_ROW_INFO_VERSION_3) {
        pod5_set_error(arrow::Status::Invalid("Unable to write V1 + V2 reads, update to V3 API."));
        return false;
    }

    // Column pointers shared by the V3 and V4 layouts; checking stops at the
    // first null pointer.
    auto const common_fields_present = [](auto const * rows) -> bool {
        return check_not_null(rows->read_id) && check_not_null(rows->read_number)
               && check_not_null(rows->start_sample) && check_not_null(rows->median_before)
               && check_not_null(rows->channel) && check_not_null(rows->well)
               && check_not_null(rows->pore_type) && check_not_null(rows->calibration_offset)
               && check_not_null(rows->calibration_scale) && check_not_null(rows->end_reason)
               && check_not_null(rows->end_reason_forced) && check_not_null(rows->run_info_id)
               && check_not_null(rows->num_minknow_events)
               && check_not_null(rows->tracked_scaling_scale)
               && check_not_null(rows->tracked_scaling_shift)
               && check_not_null(rows->predicted_scaling_scale)
               && check_not_null(rows->predicted_scaling_shift)
               && check_not_null(rows->num_reads_since_mux_change)
               && check_not_null(rows->time_since_mux_change);
    };

    if (struct_version == READ_BATCH_ROW_INFO_VERSION_3) {
        return common_fields_present(static_cast<ReadBatchRowInfoArrayV3 const *>(row_data));
    }

    if (struct_version == READ_BATCH_ROW_INFO_VERSION_4) {
        // V4 adds the open pore level column on top of the common fields.
        auto const * rows_v4 = static_cast<ReadBatchRowInfoArrayV4 const *>(row_data);
        return common_fields_present(rows_v4) && check_not_null(rows_v4->open_pore_level);
    }

    return true;
}

// Convert row `row_id` of a versioned C row-data structure into a pod5::ReadData.
//
// `row_data` is interpreted as ReadBatchRowInfoArrayV3 or ReadBatchRowInfoArrayV4
// according to `struct_version`. Returns true on success. Returns false after
// recording an error when the struct version is not V3/V4, the row's end reason
// is not one of the handled enum values, or the writer cannot look up the end reason.
static bool load_struct_row_into_read_data(
    std::unique_ptr<pod5::FileWriter> const & writer,
    pod5::ReadData & read_data,
    std::uint16_t struct_version,
    void const * row_data,
    std::uint32_t row_id)
{
    static_assert(
        READ_BATCH_ROW_INFO_VERSION == READ_BATCH_ROW_INFO_VERSION_4,
        "New versions must be explicitly loaded");

    // Loads every field shared by the V3 and V4 layouts; generic over the typed
    // array structure so both versions use the same code.
    auto load_common_v3_v4_fields = [](std::unique_ptr<pod5::FileWriter> const & writer,
                                       auto const * typed_row_data,
                                       std::uint32_t row_id,
                                       pod5::ReadData & read_data) {
        pod5::Uuid read_id_uuid{typed_row_data->read_id[row_id]};

        // Translate the C end reason into the internal enum; the optional stays
        // empty when the value matches none of the cases.
        std::optional<pod5::ReadEndReason> end_reason_internal;
        switch (typed_row_data->end_reason[row_id]) {
        case POD5_END_REASON_UNKNOWN:
            end_reason_internal = pod5::ReadEndReason::unknown;
            break;
        case POD5_END_REASON_MUX_CHANGE:
            end_reason_internal = pod5::ReadEndReason::mux_change;
            break;
        case POD5_END_REASON_UNBLOCK_MUX_CHANGE:
            end_reason_internal = pod5::ReadEndReason::unblock_mux_change;
            break;
        case POD5_END_REASON_DATA_SERVICE_UNBLOCK_MUX_CHANGE:
            end_reason_internal = pod5::ReadEndReason::data_service_unblock_mux_change;
            break;
        case POD5_END_REASON_SIGNAL_POSITIVE:
            end_reason_internal = pod5::ReadEndReason::signal_positive;
            break;
        case POD5_END_REASON_SIGNAL_NEGATIVE:
            end_reason_internal = pod5::ReadEndReason::signal_negative;
            break;
        case POD5_END_REASON_API_REQUEST:
            end_reason_internal = pod5::ReadEndReason::api_request;
            break;
        case POD5_END_REASON_DEVICE_DATA_ERROR:
            end_reason_internal = pod5::ReadEndReason::device_data_error;
            break;
        case POD5_END_REASON_ANALYSIS_CONFIG_CHANGE:
            end_reason_internal = pod5::ReadEndReason::analysis_config_change;
            break;
        case POD5_END_REASON_PAUSED:
            end_reason_internal = pod5::ReadEndReason::paused;
            break;
        }
        if (!end_reason_internal.has_value()) {
            pod5_set_error(
                arrow::Status::Invalid(
                    "out of range end reason ",
                    typed_row_data->end_reason[row_id],
                    " passed to add read"));
            return false;
        }

        // The read stores the writer's index for the end reason, not the enum itself.
        auto const end_reason_index = writer->lookup_end_reason(*end_reason_internal);
        if (!end_reason_index.ok()) {
            pod5_set_error(end_reason_index.status());
            return false;
        }

        // NOTE(review): the initialiser is positional, so this order must match
        // the pod5::ReadData member order (not visible here) — confirm when editing.
        read_data = pod5::ReadData{
            read_id_uuid,
            typed_row_data->read_number[row_id],
            typed_row_data->start_sample[row_id],
            typed_row_data->channel[row_id],
            typed_row_data->well[row_id],
            typed_row_data->pore_type[row_id],
            typed_row_data->calibration_offset[row_id],
            typed_row_data->calibration_scale[row_id],
            typed_row_data->median_before[row_id],
            *end_reason_index,
            typed_row_data->end_reason_forced[row_id] != 0,
            typed_row_data->run_info_id[row_id],
            typed_row_data->num_minknow_events[row_id],
            typed_row_data->tracked_scaling_scale[row_id],
            typed_row_data->tracked_scaling_shift[row_id],
            typed_row_data->predicted_scaling_scale[row_id],
            typed_row_data->predicted_scaling_shift[row_id],
            typed_row_data->num_reads_since_mux_change[row_id],
            typed_row_data->time_since_mux_change[row_id],
            // open_pore_level is only present in v4.
            std::numeric_limits<float>::quiet_NaN()};
        return true;
    };

    // Version 0-2 are no longer supported for writing.
    if (struct_version == READ_BATCH_ROW_INFO_VERSION_4) {
        auto const * typed_row_data = static_cast<ReadBatchRowInfoArrayV4 const *>(row_data);

        if (!load_common_v3_v4_fields(writer, typed_row_data, row_id, read_data)) {
            return false;
        }
        // Replace the NaN placeholder with the value supplied by the V4 structure.
        read_data.open_pore_level = typed_row_data->open_pore_level[row_id];
    } else if (struct_version == READ_BATCH_ROW_INFO_VERSION_3) {
        auto const * typed_row_data = static_cast<ReadBatchRowInfoArrayV3 const *>(row_data);

        if (!load_common_v3_v4_fields(writer, typed_row_data, row_id, read_data)) {
            return false;
        }
    } else {
        pod5_set_error(
            arrow::Status::Invalid("Invalid writer struct version '", struct_version, "' passed"));
        return false;
    }
    return true;
};

/// \brief Add a batch of reads, with uncompressed signal, to a writer.
///
/// \param file            The writer to add the reads to.
/// \param read_count      Number of reads described by the arrays below.
/// \param struct_version  Version of the structure \p row_data points to.
/// \param row_data        Versioned read row data (see check_read_data_struct).
/// \param signal          One signal pointer per read; each must be non-null.
/// \param signal_size     One sample count per read.
/// \return POD5_OK on success (including when \p read_count is zero), otherwise the
///         error code recorded for this call.
pod5_error_t pod5_add_reads_data(
    Pod5FileWriter_t * file,
    uint32_t read_count,
    uint16_t struct_version,
    void const * row_data,
    int16_t const ** signal,
    uint32_t const * signal_size)
{
    pod5_reset_error();

    if (!check_file_not_null(file)) {
        return g_pod5_error_no;
    }
    if (read_count == 0) {
        return POD5_OK;
    }

    bool const arrays_ok = check_read_data_struct(struct_version, row_data)
                           && check_not_null(signal) && check_not_null(signal_size);
    if (!arrays_ok) {
        return g_pod5_error_no;
    }

    // Validate every signal pointer up front so nothing is written on bad input.
    for (std::uint32_t read_idx = 0; read_idx < read_count; ++read_idx) {
        if (!check_not_null(signal[read_idx])) {
            return g_pod5_error_no;
        }
    }

    for (std::uint32_t read_idx = 0; read_idx < read_count; ++read_idx) {
        pod5::ReadData row;
        bool const loaded =
            load_struct_row_into_read_data(file->writer, row, struct_version, row_data, read_idx);
        if (!loaded) {
            return g_pod5_error_no;
        }

        POD5_C_RETURN_NOT_OK(file->writer->add_complete_read(
            row, gsl::make_span(signal[read_idx], signal_size[read_idx])));
    }

    return POD5_OK;
}

/// \brief Add a batch of reads whose signal is already compressed, in chunks.
///
/// \param file                    The writer to add the reads to.
/// \param read_count              Number of reads described by the arrays below.
/// \param struct_version          Version of the structure \p row_data points to.
/// \param row_data                Versioned read row data (see check_read_data_struct).
/// \param compressed_signal       Per read, an array of compressed chunk pointers.
/// \param compressed_signal_size  Per read, an array of compressed chunk sizes in bytes.
/// \param sample_counts           Per read, an array of sample counts for each chunk.
/// \param signal_chunk_count      Per read, the number of chunks.
/// \return POD5_OK on success (including when \p read_count is zero), otherwise the
///         error code recorded for this call.
pod5_error_t pod5_add_reads_data_pre_compressed(
    Pod5FileWriter_t * file,
    uint32_t read_count,
    uint16_t struct_version,
    void const * row_data,
    char const *** compressed_signal,
    size_t const ** compressed_signal_size,
    uint32_t const ** sample_counts,
    size_t const * signal_chunk_count)
{
    pod5_reset_error();

    if (!check_file_not_null(file)) {
        return g_pod5_error_no;
    }
    if (read_count == 0) {
        return POD5_OK;
    }

    bool const arrays_ok = check_read_data_struct(struct_version, row_data)
                           && check_not_null(compressed_signal)
                           && check_not_null(compressed_signal_size)
                           && check_not_null(sample_counts) && check_not_null(signal_chunk_count);
    if (!arrays_ok) {
        return g_pod5_error_no;
    }

    // Validate every per-read array up front so nothing is written on bad input.
    for (std::uint32_t read_idx = 0; read_idx < read_count; ++read_idx) {
        bool const read_arrays_ok = check_not_null(compressed_signal[read_idx])
                                    && check_not_null(compressed_signal_size[read_idx])
                                    && check_not_null(sample_counts[read_idx]);
        if (!read_arrays_ok) {
            return g_pod5_error_no;
        }
    }

    for (std::uint32_t read_idx = 0; read_idx < read_count; ++read_idx) {
        pod5::ReadData row;
        bool const loaded =
            load_struct_row_into_read_data(file->writer, row, struct_version, row_data, read_idx);
        if (!loaded) {
            return g_pod5_error_no;
        }

        // Write each chunk, collecting its signal row id and the running sample total.
        std::vector<std::uint64_t> signal_rows;
        std::uint64_t total_sample_count = 0;
        auto const chunk_count = signal_chunk_count[read_idx];
        for (std::size_t chunk = 0; chunk < chunk_count; ++chunk) {
            auto const chunk_bytes = compressed_signal[read_idx][chunk];
            auto const chunk_byte_count = compressed_signal_size[read_idx][chunk];
            auto const chunk_samples = sample_counts[read_idx][chunk];
            total_sample_count += chunk_samples;
            POD5_C_ASSIGN_OR_RAISE(
                auto signal_row_id,
                file->writer->add_pre_compressed_signal(
                    row.read_id,
                    gsl::make_span(chunk_bytes, chunk_byte_count).as_span<std::uint8_t const>(),
                    chunk_samples));
            signal_rows.push_back(signal_row_id);
        }

        POD5_C_RETURN_NOT_OK(file->writer->add_complete_read(
            row, gsl::make_span(signal_rows), total_sample_count));
    }
    return POD5_OK;
}

/// \brief Get the maximum compressed size for a signal of \p sample_count samples.
///
/// \param sample_count  Number of samples in the signal.
/// \return The maximum compressed size, or 0 after recording an error.
size_t pod5_vbz_compressed_signal_max_size(size_t sample_count)
{
    pod5_reset_error();

    auto const max_size = pod5::compressed_signal_max_size(sample_count);
    if (max_size.ok()) {
        return max_size.ValueUnsafe();
    }

    // TODO: on MAJOR_VERSION bump change this to return an error code.
    pod5_set_error(max_size.status());
    return 0;
}

/// \brief VBZ compress a signal into a caller supplied buffer.
///
/// \param signal                  The samples to compress.
/// \param signal_size             Number of samples in \p signal.
/// \param compressed_signal_out   [out] Buffer receiving the compressed bytes.
/// \param compressed_signal_size  [in,out] On entry the capacity of
///                                \p compressed_signal_out in bytes; on success the
///                                number of bytes written. Left unchanged on failure.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_vbz_compress_signal(
    int16_t const * signal,
    size_t signal_size,
    char * compressed_signal_out,
    size_t * compressed_signal_size)
{
    pod5_reset_error();

    if (!check_not_null(signal) || !check_output_pointer_not_null(compressed_signal_out)
        || !check_output_pointer_not_null(compressed_signal_size))
    {
        return g_pod5_error_no;
    }

    POD5_C_ASSIGN_OR_RAISE(
        auto buffer,
        pod5::compress_signal(gsl::make_span(signal, signal_size), arrow::system_memory_pool()));

    if ((std::size_t)buffer->size() > *compressed_signal_size) {
        // Report the caller's buffer capacity (the pointee), not the pointer itself.
        pod5_set_error(
            pod5::Status::Invalid(
                "Compressed signal size (",
                buffer->size(),
                ") is greater than provided buffer size (",
                *compressed_signal_size,
                ")"));
        return g_pod5_error_no;
    }

    std::copy(buffer->data(), buffer->data() + buffer->size(), compressed_signal_out);
    *compressed_signal_size = buffer->size();

    return POD5_OK;
}

/// \brief Decompress a VBZ compressed signal into a caller supplied buffer.
///
/// \param compressed_signal       The compressed bytes.
/// \param compressed_signal_size  Number of bytes in \p compressed_signal.
/// \param sample_count            Number of samples \p signal_out can hold.
/// \param signal_out              [out] Receives the decompressed samples.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_vbz_decompress_signal(
    char const * compressed_signal,
    size_t compressed_signal_size,
    size_t sample_count,
    int16_t * signal_out)
{
    pod5_reset_error();

    if (!check_not_null(compressed_signal)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(signal_out)) {
        return g_pod5_error_no;
    }

    // View the input as bytes and the output as samples.
    auto const compressed_bytes =
        gsl::make_span(compressed_signal, compressed_signal_size).as_span<std::uint8_t const>();
    auto destination = gsl::make_span(signal_out, sample_count);

    POD5_C_RETURN_NOT_OK(
        pod5::decompress_signal(compressed_bytes, arrow::system_memory_pool(), destination));

    return POD5_OK;
}

/// \brief Format a binary read id as a NUL-terminated string.
///
/// \param read_id         The binary read id.
/// \param read_id_string  [out] Buffer receiving the text form; index 36 is set to the
///                        terminator, so the buffer must hold at least 37 characters.
/// \return POD5_OK on success, otherwise the error code recorded for this call.
pod5_error_t pod5_format_read_id(read_id_t const read_id, char * read_id_string)
{
    pod5_reset_error();

    if (!check_not_null(read_id)) {
        return g_pod5_error_no;
    }
    if (!check_output_pointer_not_null(read_id_string)) {
        return g_pod5_error_no;
    }

    // Reinterpret the raw bytes as a Uuid to reuse its text formatting.
    auto const & uuid = *reinterpret_cast<pod5::Uuid const *>(read_id);
    uuid.write_to(read_id_string);
    read_id_string[36] = '\0';

    return POD5_OK;
}
}


================================================
FILE: c++/pod5_format/c_api.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"

#include <stddef.h>
#include <stdint.h>

#ifdef __cplusplus
extern "C" {
#endif

// POD5_DEPRECATED marks a declaration as deprecated where the toolchain allows it:
// - when _WIN32 is not defined, the GNU-style `__attribute__((deprecated))` is used;
// - when _WIN32 is defined and __STDC_VERSION__ >= 202000, the standard
//   `[[deprecated]]` attribute is used;
// - otherwise the macro expands to nothing.
#ifndef _WIN32
#define POD5_DEPRECATED __attribute__((deprecated))
#elif (__STDC_VERSION__ >= 202000)
#define POD5_DEPRECATED [[deprecated]]
#else
#define POD5_DEPRECATED
#endif

/// All functions are thread safe unless otherwise stated. Types may be used by multiple
/// threads as long as the functions being called only take them by const pointer.

struct Pod5FileReader;
typedef struct Pod5FileReader Pod5FileReader_t;
struct Pod5FileWriter;
typedef struct Pod5FileWriter Pod5FileWriter_t;
struct Pod5ReadRecordBatch;
typedef struct Pod5ReadRecordBatch Pod5ReadRecordBatch_t;

//---------------------------------------------------------------------------------------------------------------------
// Error management
//---------------------------------------------------------------------------------------------------------------------

/// \brief Integer error codes.
/// \note Taken from the arrow status enum.
enum pod5_error {
    // Success: no error occurred.
    POD5_OK = 0,
    POD5_ERROR_OUTOFMEMORY = 1,
    POD5_ERROR_KEYERROR = 2,
    POD5_ERROR_TYPEERROR = 3,
    POD5_ERROR_INVALID = 4,
    POD5_ERROR_IOERROR = 5,
    POD5_ERROR_CAPACITYERROR = 6,
    POD5_ERROR_INDEXERROR = 7,
    POD5_ERROR_CANCELLED = 8,
    POD5_ERROR_UNKNOWNERROR = 9,
    POD5_ERROR_NOTIMPLEMENTED = 10,
    POD5_ERROR_SERIALIZATIONERROR = 11,
    // Returned by string getters (e.g. pod5_get_end_reason, pod5_get_pore_type) when
    // the caller supplied buffer cannot hold the string and its terminator.
    POD5_ERROR_STRING_NOT_LONG_ENOUGH = 12,
};
// Convenience alias so the enum can be used without the `enum` keyword.
typedef enum pod5_error pod5_error_t;

/// \brief Get the most recent error number from all pod5 api's on the current thread.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_error_no();
/// \brief Get the most recent error description string from all pod5 APIs on the current thread.
/// \return A string describing the most recent error on the calling thread.
/// \note The string's lifetime is internally managed, a caller should not free it.
/// \note Declared with an explicit (void) parameter list so that C callers get a real
///       prototype (an empty list in C leaves the arguments unchecked).
POD5_FORMAT_EXPORT char const * pod5_get_error_string(void);

//---------------------------------------------------------------------------------------------------------------------
// Global state
//---------------------------------------------------------------------------------------------------------------------

/// \brief Initialise and register global pod5 types
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Declared with an explicit (void) parameter list so that C callers get a real
///       prototype (an empty list in C leaves the arguments unchecked).
POD5_FORMAT_EXPORT pod5_error_t pod5_init(void);
/// \brief Terminate global pod5 types
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Declared with an explicit (void) parameter list so that C callers get a real
///       prototype (an empty list in C leaves the arguments unchecked).
POD5_FORMAT_EXPORT pod5_error_t pod5_terminate(void);

//---------------------------------------------------------------------------------------------------------------------
// Shared Structures
//---------------------------------------------------------------------------------------------------------------------

// Enumerated reasons for a read ending.
// This is the enum value reported by pod5_get_end_reason and the element type of the
// end_reason arrays in the ReadBatchRowInfoArray structures.
enum pod5_end_reason {
    POD5_END_REASON_UNKNOWN = 0,
    POD5_END_REASON_MUX_CHANGE = 1,
    POD5_END_REASON_UNBLOCK_MUX_CHANGE = 2,
    POD5_END_REASON_DATA_SERVICE_UNBLOCK_MUX_CHANGE = 3,
    POD5_END_REASON_SIGNAL_POSITIVE = 4,
    POD5_END_REASON_SIGNAL_NEGATIVE = 5,
    POD5_END_REASON_API_REQUEST = 6,
    POD5_END_REASON_DEVICE_DATA_ERROR = 7,
    POD5_END_REASON_ANALYSIS_CONFIG_CHANGE = 8,
    POD5_END_REASON_PAUSED = 9
};
// Convenience alias so C callers do not need to spell `enum pod5_end_reason`.
typedef enum pod5_end_reason pod5_end_reason_t;

// Index (and count) type for the run infos stored in a file
// (see pod5_get_file_run_info and pod5_get_file_run_info_count).
typedef uint16_t run_info_index_t;

// A read id in binary form: 16 raw bytes.
typedef uint8_t read_id_t[16];
// A 16 byte binary id with the same layout as read_id_t.
// NOTE(review): not referenced elsewhere in the visible part of this header - presumably
// identifies a run; confirm against callers.
typedef uint8_t run_id_t[16];

// Single entry of read data (struct version 3, see READ_BATCH_ROW_INFO_VERSION_3):
struct ReadBatchRowInfoV3 {
    // The read id data, in binary form.
    read_id_t read_id;

    // Read number for the read.
    uint32_t read_number;
    // Start sample for the read.
    uint64_t start_sample;
    // Median before level.
    float median_before;

    // Channel for the read.
    uint16_t channel;
    // Well for the read.
    uint8_t well;
    // Dictionary index for the pore type (resolve with pod5_get_pore_type).
    int16_t pore_type;
    // Calibration offset for the read.
    float calibration_offset;
    // Calibration scale for the read.
    float calibration_scale;
    // End reason index for the read (resolve with pod5_get_end_reason).
    int16_t end_reason;
    // Was the end reason for the read forced (0 for false, 1 for true).
    uint8_t end_reason_forced;
    // Dictionary index for run id for the read, can be used to look up run info
    // (see pod5_get_run_info).
    int16_t run_info;

    // Number of minknow events that the read contains
    uint64_t num_minknow_events;

    // Scale/Shift for tracked read scaling values (based on previous reads)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float tracked_scaling_scale;
    POD5_DEPRECATED float tracked_scaling_shift;

    // Scale/Shift for predicted read scaling values (based on this read's raw signal)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float predicted_scaling_scale;
    POD5_DEPRECATED float predicted_scaling_shift;

    // How many reads have been selected prior to this read on the channel-well since it was made active.
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED uint32_t num_reads_since_mux_change;
    // How many seconds have passed since the channel-well was made active
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float time_since_mux_change;

    // Number of signal row entries for the read
    // (the count expected by pod5_get_signal_row_indices).
    int64_t signal_row_count;

    // The length of the read in samples.
    uint64_t num_samples;
};

// Single entry of read data (struct version 4, see READ_BATCH_ROW_INFO_VERSION_4).
// Same fields as ReadBatchRowInfoV3 with open_pore_level appended at the end.
struct ReadBatchRowInfoV4 {
    // The read id data, in binary form.
    read_id_t read_id;

    // Read number for the read.
    uint32_t read_number;
    // Start sample for the read.
    uint64_t start_sample;
    // Median before level.
    float median_before;

    // Channel for the read.
    uint16_t channel;
    // Well for the read.
    uint8_t well;
    // Dictionary index for the pore type (resolve with pod5_get_pore_type).
    int16_t pore_type;
    // Calibration offset for the read.
    float calibration_offset;
    // Calibration scale for the read.
    float calibration_scale;
    // End reason index for the read (resolve with pod5_get_end_reason).
    int16_t end_reason;
    // Was the end reason for the read forced (0 for false, 1 for true).
    uint8_t end_reason_forced;
    // Dictionary index for run id for the read, can be used to look up run info
    // (see pod5_get_run_info).
    int16_t run_info;

    // Number of minknow events that the read contains
    uint64_t num_minknow_events;

    // Scale/Shift for tracked read scaling values (based on previous reads)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float tracked_scaling_scale;
    POD5_DEPRECATED float tracked_scaling_shift;

    // Scale/Shift for predicted read scaling values (based on this read's raw signal)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float predicted_scaling_scale;
    POD5_DEPRECATED float predicted_scaling_shift;

    // How many reads have been selected prior to this read on the channel-well since it was made active.
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED uint32_t num_reads_since_mux_change;
    // How many seconds have passed since the channel-well was made active
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float time_since_mux_change;

    // Number of signal row entries for the read
    // (the count expected by pod5_get_signal_row_indices).
    int64_t signal_row_count;

    // The length of the read in samples.
    uint64_t num_samples;

    // The level of the pore.
    float open_pore_level;
};

// Typedef for latest batch row info structure (matches READ_BATCH_ROW_INFO_VERSION).
typedef struct ReadBatchRowInfoV4 ReadBatchRowInfo_t;

// Array of read data (struct version 3). The whole structure is marked deprecated;
// ReadBatchRowInfoArray_t refers to the version 4 layout.
// Each member points to an array holding one value per read.
struct POD5_DEPRECATED ReadBatchRowInfoArrayV3 {
    // The read id data, in binary form.
    read_id_t const * read_id;

    // Read number for the read.
    uint32_t const * read_number;
    // Start sample for the read.
    uint64_t const * start_sample;
    // Median before level.
    float const * median_before;

    // Channel for the read.
    uint16_t const * channel;
    // Well for the read.
    uint8_t const * well;
    // Pore type for the read.
    int16_t const * pore_type;
    // Calibration offset for the read.
    float const * calibration_offset;
    // Calibration scale for the read.
    float const * calibration_scale;
    // End reason type for the read.
    pod5_end_reason_t const * end_reason;
    // Was the end reason for the read forced (0 for false, 1 for true).
    uint8_t const * end_reason_forced;
    // Run info type for the read.
    int16_t const * run_info_id;

    // Number of minknow events that the read contains
    uint64_t const * num_minknow_events;

    // Scale/Shift for tracked read scaling values (based on previous reads)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float const * tracked_scaling_scale;
    POD5_DEPRECATED float const * tracked_scaling_shift;

    // Scale/Shift for predicted read scaling values (based on this read's raw signal)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float const * predicted_scaling_scale;
    POD5_DEPRECATED float const * predicted_scaling_shift;

    // How many reads have been selected prior to this read on the channel-well since it was made active.
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED uint32_t const * num_reads_since_mux_change;
    // How many seconds have passed since the channel-well was made active
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float const * time_since_mux_change;
};

// Array of read data (struct version 4, see READ_BATCH_ROW_INFO_VERSION_4).
// Each member points to an array holding one value per read; when passed to
// pod5_add_reads_data every array must have read_count entries.
struct ReadBatchRowInfoArrayV4 {
    // The read id data, in binary form.
    read_id_t const * read_id;

    // Read number for the read.
    uint32_t const * read_number;
    // Start sample for the read.
    uint64_t const * start_sample;
    // Median before level.
    float const * median_before;

    // Channel for the read.
    uint16_t const * channel;
    // Well for the read.
    uint8_t const * well;
    // Pore type for the read.
    int16_t const * pore_type;
    // Calibration offset for the read.
    float const * calibration_offset;
    // Calibration scale for the read.
    float const * calibration_scale;
    // End reason type for the read.
    pod5_end_reason_t const * end_reason;
    // Was the end reason for the read forced (0 for false, 1 for true).
    uint8_t const * end_reason_forced;
    // Run info type for the read.
    int16_t const * run_info_id;

    // Number of minknow events that the read contains
    uint64_t const * num_minknow_events;

    // Scale/Shift for tracked read scaling values (based on previous reads)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float const * tracked_scaling_scale;
    POD5_DEPRECATED float const * tracked_scaling_shift;

    // Scale/Shift for predicted read scaling values (based on this read's raw signal)
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float const * predicted_scaling_scale;
    POD5_DEPRECATED float const * predicted_scaling_shift;

    // How many reads have been selected prior to this read on the channel-well since it was made active.
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED uint32_t const * num_reads_since_mux_change;
    // How many seconds have passed since the channel-well was made active
    // DEPRECATED: will be removed in 0.4.0
    POD5_DEPRECATED float const * time_since_mux_change;

    // The level of the pore.
    float const * open_pore_level;
};

// Typedef for latest batch row info array structure (matches READ_BATCH_ROW_INFO_VERSION).
typedef struct ReadBatchRowInfoArrayV4 ReadBatchRowInfoArray_t;

// Version numbers for the read batch row info structures. Calling code passes one of these
// as the struct_version argument (e.g. to pod5_get_read_batch_row_info_data) to say which
// structure layout it was compiled against.

// First numbered version.
#define READ_BATCH_ROW_INFO_VERSION_0 0
// Addition of num_minknow_events fields, scaling fields.
#define READ_BATCH_ROW_INFO_VERSION_1 1
// Addition of num_samples fields.
#define READ_BATCH_ROW_INFO_VERSION_2 2
// Flattening of read structures.
#define READ_BATCH_ROW_INFO_VERSION_3 3
// Introduction of new open_pore_level field.
#define READ_BATCH_ROW_INFO_VERSION_4 4
// Latest available version (the layout of ReadBatchRowInfo_t / ReadBatchRowInfoArray_t).
#define READ_BATCH_ROW_INFO_VERSION READ_BATCH_ROW_INFO_VERSION_4

//---------------------------------------------------------------------------------------------------------------------
// Reading files
//---------------------------------------------------------------------------------------------------------------------

// Options to control how a file is read (passed to pod5_open_file_options).
struct Pod5ReaderOptions {
    /// \brief Disable file mapping into memory. Reduces memory usage of pod5 files, at the expense
    ///        of the underlying arrow file loading into memory on demand.
    /// \note Presumably any non-zero value enables this option - confirm against the implementation.
    char force_disable_file_mapping;
};
typedef struct Pod5ReaderOptions Pod5ReaderOptions_t;

/// \brief Open a file reader with default options.
/// \param filename The filename of the pod5 file.
/// \return A reader handle, to be released with pod5_close_and_free_reader().
///         Presumably null on error, as documented for pod5_open_file_options - confirm.
/// \see pod5_open_file_options
POD5_FORMAT_EXPORT Pod5FileReader_t * pod5_open_file(char const * filename);

/// \brief Open a file reader using caller supplied options.
/// \param filename         The filename of the pod5 file.
/// \param options          The options to use when opening the file.
/// \return A reader, or null on error. The reason for the error can be queried with
///         pod5_get_error_no() and pod5_get_error_string().
/// \note A returned reader should be released with pod5_close_and_free_reader().
POD5_FORMAT_EXPORT Pod5FileReader_t * pod5_open_file_options(
    char const * filename,
    Pod5ReaderOptions_t const * options);

/// \brief Close a file reader, releasing all memory held by the reader.
/// \param file A previously opened reader.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Any references to \a file or its components are no longer valid after this call.
/// \note It is safe to call this with a null \a file.
POD5_FORMAT_EXPORT pod5_error_t pod5_close_and_free_reader(Pod5FileReader_t * file);

// Information about a file, filled in by pod5_get_file_info.
struct FileInfo {
    // Identifier for the file: 16 raw bytes (declared using the read_id_t byte array type).
    read_id_t file_identifier;

    // Version reported for the file, split into three numeric components.
    // NOTE(review): presumably the version of the software that wrote the file - confirm.
    struct Version {
        uint16_t major;
        uint16_t minor;
        uint16_t revision;
    } version;
};
typedef struct FileInfo FileInfo_t;

/// \brief Find info about a file.
/// \param[in]  file        The file to be queried.
/// \param[out] file_info   The info read from the file (caller provided storage).
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_file_info(Pod5FileReader_t const * file, FileInfo_t * file_info);

// Location of one table embedded in a pod5 file, as reported by the
// pod5_get_file_*_table_location functions.
struct EmbeddedFileData {
    // The embedded file name - note this may not be the original file name, if the file has been migrated.
    // This pointer will remain valid until the next pod5 api call on the associated reader.
    char const * file_name;
    // Where the table data starts within file_name (presumably a byte offset - confirm).
    size_t offset;
    // Extent of the table data starting at offset (presumably in bytes - confirm).
    size_t length;
};
typedef struct EmbeddedFileData EmbeddedFileData_t;

/// \brief Find the location of the read table data
/// \param[in]  file        The file to be queried.
/// \param[out] file_data   The output read table file data.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_file_read_table_location(Pod5FileReader_t const * file, EmbeddedFileData_t * file_data);

/// \brief Find the location of the signal table data
/// \param[in]  file        The file to be queried.
/// \param[out] file_data   The output signal table file data.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_file_signal_table_location(Pod5FileReader_t const * file, EmbeddedFileData_t * file_data);

/// \brief Find the location of the run info table data
/// \param[in]  file        The file to be queried.
/// \param[out] file_data   The output run info table file data.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_file_run_info_table_location(
    Pod5FileReader_t const * file,
    EmbeddedFileData_t * file_data);

/// \brief Find the number of reads in the file.
/// \param[in]  reader  The file reader to read from
/// \param[out] count   The number of reads in the file
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The count can be used to size the array passed to pod5_get_read_ids.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_read_count(Pod5FileReader_t const * reader, size_t * count);

/// \brief Copy the read ids from the file into a caller allocated array.
/// \param[in]  reader        The file reader to read from.
/// \param      count         The number of read ids allocated in [read_ids], an error is raised if the count is not greater than or equal to the value from pod5_get_read_count.
/// \param[out] read_ids      The read ids written in a contiguous array.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_read_ids(Pod5FileReader_t const * reader, size_t count, read_id_t * read_ids);

/// \brief Plan the most efficient route through the data for the given read ids
/// \param[in]  file                The file to be queried.
/// \param[in]  read_id_array       The read id array (contiguous array, 16 bytes per id).
/// \param      read_id_count       The number of read ids.
/// \param[out] batch_counts        The number of rows per batch that need to be visited (rows listed in batch_rows),
///                                 input array length should be the number of read table batches
///                                 (see pod5_get_read_batch_count).
/// \param[out] batch_rows          Rows to visit per batch, packed into one array. Offsets into this array from
///                                 [batch_counts] provide the per-batch row data. Input array length should
///                                 equal read_id_count.
/// \param[out] find_success_count  The number of requested read ids that were found.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The output arrays are sorted in file storage order, to improve read efficiency.
/// \note Both output arrays are allocated by the caller.
POD5_FORMAT_EXPORT pod5_error_t pod5_plan_traversal(
    Pod5FileReader_t const * file,
    uint8_t const * read_id_array,
    size_t read_id_count,
    uint32_t * batch_counts,
    uint32_t * batch_rows,
    size_t * find_success_count);

/// \brief Find the number of read batches in the file.
/// \param[out] count   The number of read batches in the file
/// \param[in]  reader  The file reader to read from
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The output parameter comes first in this function's argument list.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_read_batch_count(size_t * count, Pod5FileReader_t const * reader);

/// \brief Get a read batch from the file.
/// \param[out] batch   The extracted batch.
/// \param[in]  reader  The file reader to read from
/// \param      index   The index of the batch to read (see pod5_get_read_batch_count for the number of batches).
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Batches returned from this API must be freed using #pod5_free_read_batch
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_read_batch(Pod5ReadRecordBatch_t ** batch, Pod5FileReader_t const * reader, size_t index);

/// \brief Release a read batch when it is no longer used.
/// \param batch The batch to release.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Any references to \a batch or its components are no longer valid after this call.
/// \note It is safe to call this with a null \a batch.
POD5_FORMAT_EXPORT pod5_error_t pod5_free_read_batch(Pod5ReadRecordBatch_t * batch);

/// \brief Find the number of rows in a batch.
/// \param[out] count   The number of rows in the batch.
/// \param[in]  batch   The batch to query the number of rows for.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The output parameter comes first in this function's argument list.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_read_batch_row_count(size_t * count, Pod5ReadRecordBatch_t const * batch);

/// \brief Find the info for a row in a read batch.
/// \param[in]  batch               The read batch to query.
/// \param      row                 The row index to query.
/// \param      struct_version      The version of the struct being passed in, calling code
///                                 should use [READ_BATCH_ROW_INFO_VERSION].
/// \param[out] row_data            The data for reading into, should be a pointer to ReadBatchRowInfo_t.
///                                 It is passed as void* so the layout can be selected by struct_version.
/// \param[out] read_table_version  The table version read from the file, will indicate which fields should be available.
///                                 See READ_BATCH_ROW_INFO_VERSION and ReadBatchRowInfo_t above for corresponding fields.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_read_batch_row_info_data(
    Pod5ReadRecordBatch_t const * batch,
    size_t row,
    uint16_t struct_version,
    void * row_data,
    uint16_t * read_table_version);

/// \brief Find the signal indices for a row in a read batch.
/// \param[in]  batch                       The read batch to query.
/// \param      row                         The row index to query.
/// \param      signal_row_indices_count    Number of entries in the signal_row_indices array.
/// \param[out] signal_row_indices          The signal row indices read out of the read row (caller allocated).
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note signal_row_indices_count must equal the signal_row_count returned from
///       pod5_get_read_batch_row_info_data or an error is generated.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_signal_row_indices(
    Pod5ReadRecordBatch_t const * batch,
    size_t row,
    int64_t signal_row_indices_count,
    uint64_t * signal_row_indices);

// Extra calibration values for a read, filled in by pod5_get_calibration_extra_info.
struct CalibrationExtraData {
    // The digitisation value used by the sequencer, equal to:
    //
    // adc_max - adc_min + 1
    uint16_t digitisation;
    // The range of the calibrated channel in pA.
    float range;
};
typedef struct CalibrationExtraData CalibrationExtraData_t;

/// \brief Find the extra calibration info for a row in a read batch.
/// \param[in]  batch                   The read batch to query.
/// \param      row                     The read row index.
/// \param[out] calibration_extra_data  Output location for the calibration data.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The values are computed from data held in the file, and written directly to the address provided, there is no need to release any data.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_calibration_extra_info(
    Pod5ReadRecordBatch_t const * batch,
    size_t row,
    CalibrationExtraData_t * calibration_extra_data);

// A string-to-string map stored as two parallel arrays
// (used for the context_tags and tracking_id members of RunInfoDictData).
struct KeyValueData {
    // Presumably the number of entries in both keys and values - confirm.
    size_t size;
    // Key strings.
    char const ** keys;
    // Value strings; presumably values[i] belongs to keys[i] - confirm.
    char const ** values;
};

// Run info for a sequencing run, as returned by pod5_get_run_info and
// pod5_get_file_run_info. Instances returned by those functions should be released
// with pod5_free_run_info.
// The member names match the parameters of pod5_add_run_info, which documents each value;
// the two KeyValueData members correspond to that function's
// context_tags_* and tracking_id_* parameters.
struct RunInfoDictData {
    char const * acquisition_id;
    int64_t acquisition_start_time_ms;
    int16_t adc_max;
    int16_t adc_min;
    struct KeyValueData context_tags;
    char const * experiment_name;
    char const * flow_cell_id;
    char const * flow_cell_product_code;
    char const * protocol_name;
    char const * protocol_run_id;
    int64_t protocol_start_time_ms;
    char const * sample_id;
    uint16_t sample_rate;
    char const * sequencing_kit;
    char const * sequencer_position;
    char const * sequencer_position_type;
    char const * software;
    char const * system_name;
    char const * system_type;
    struct KeyValueData tracking_id;
};
typedef struct RunInfoDictData RunInfoDictData_t;

/// \brief Find the run info for a row in a read batch.
/// \param[in]  batch               The read batch to query.
/// \param      run_info            The run info index to query from the passed batch
///                                 (the run_info value of a read row).
/// \param[out] run_info_data       Output location for the run info data.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The returned run_info value should be released using pod5_free_run_info when it is no longer used.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_run_info(
    Pod5ReadRecordBatch_t const * batch,
    int16_t run_info,
    RunInfoDictData_t ** run_info_data);

/// \brief Find a run info in a file by its index.
/// \param[in]  file                The file to query.
/// \param      run_info_index      The run info index to query from the passed file
///                                 (see pod5_get_file_run_info_count for the number available).
/// \param[out] run_info_data       Output location for the run info data.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The returned run_info value should be released using pod5_free_run_info when it is no longer used.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_file_run_info(
    Pod5FileReader_t const * file,
    run_info_index_t run_info_index,
    RunInfoDictData_t ** run_info_data);

/// \brief Release a RunInfoDictData struct after use.
/// \param run_info_data The run info to release (as returned by pod5_get_run_info or pod5_get_file_run_info).
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Any references to \a run_info_data or its components are no longer valid after this call.
/// \note It is safe to call this with a null \a run_info_data.
POD5_FORMAT_EXPORT pod5_error_t pod5_free_run_info(RunInfoDictData_t * run_info_data);

/// \brief Release a RunInfoDictData struct after use.
/// \param run_info_data The run info to release.
/// \deprecated Presumably superseded by pod5_free_run_info(), which has the same documented
///             purpose and is not marked deprecated - confirm before migrating callers.
POD5_FORMAT_EXPORT POD5_DEPRECATED pod5_error_t
pod5_release_run_info(RunInfoDictData_t * run_info_data);

/// \brief Find the number of run infos in a file.
/// \param[in]  file                The file to query.
/// \param[out] run_info_count      The number of run infos that are present in the queried file
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t
pod5_get_file_run_info_count(Pod5FileReader_t const * file, run_info_index_t * run_info_count);

/// \brief Find the end reason for a row in a read batch.
/// \param[in]      batch                           The read batch to query.
/// \param          end_reason                      The end reason index to query from the passed batch
///                                                 (the end_reason value of a read row).
/// \param[out]     end_reason_value                The enum value for end reason.
/// \param[out]     end_reason_string_value         Output location for the string value for the end reason (caller allocated).
/// \param[in,out]  end_reason_string_value_size    Size of [end_reason_string_value], the number of characters written (including 1 for null character) is placed in this value on return.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note If the string input is not long enough POD5_ERROR_STRING_NOT_LONG_ENOUGH is returned.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_end_reason(
    Pod5ReadRecordBatch_t const * batch,
    int16_t end_reason,
    pod5_end_reason_t * end_reason_value,
    char * end_reason_string_value,
    size_t * end_reason_string_value_size);

/// \brief Find the pore type for a row in a read batch.
/// \param[in]      batch                           The read batch to query.
/// \param          pore_type                       The pore type index to query from the passed batch
///                                                 (the pore_type value of a read row).
/// \param[out]     pore_type_string_value          Output location for the string value for the pore type (caller allocated).
/// \param[in,out]  pore_type_string_value_size     Size of [pore_type_string_value], the number of characters written (including 1 for null character) is placed in this value on return.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note If the string input is not long enough POD5_ERROR_STRING_NOT_LONG_ENOUGH is returned.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_pore_type(
    Pod5ReadRecordBatch_t const * batch,
    int16_t pore_type,
    char * pore_type_string_value,
    size_t * pore_type_string_value_size);

// Information about one signal row, produced by pod5_get_signal_row_info and
// consumed by pod5_get_signal.
struct SignalRowInfo {
    // Presumably the index of the signal table batch holding the row - confirm.
    size_t batch_index;
    // Presumably the index of the row within that batch - confirm.
    size_t batch_row_index;
    // Presumably the number of samples stored in the row, i.e. the sample_count that
    // pod5_get_signal expects - confirm.
    uint32_t stored_sample_count;
    // Presumably the number of bytes the row's signal occupies as stored - confirm.
    size_t stored_byte_count;
};
typedef struct SignalRowInfo SignalRowInfo_t;

/// \brief Find the info for one or more signal rows in a reader.
/// \param[in]  reader                      The reader to query.
/// \param      signal_rows_count           The number of signal rows to query.
/// \param[in]  signal_rows                 The signal rows to query (e.g. the indices from pod5_get_signal_row_indices).
/// \param[out] signal_row_info             Pointers to the output signal row information (must be an array of size signal_rows_count)
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The returned row infos should be released with a matching call to pod5_free_signal_row_info.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_signal_row_info(
    Pod5FileReader_t const * reader,
    size_t signal_rows_count,
    uint64_t const * signal_rows,
    SignalRowInfo_t ** signal_row_info);

/// \brief Release a list of signal row infos allocated by [pod5_get_signal_row_info].
/// \param      signal_rows_count           The number of signal rows to release.
/// \param      signal_row_info             The signal row infos to release.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Calls to pod5_free_signal_row_info must be 1:1 with [pod5_get_signal_row_info], you cannot free part of the returned data.
POD5_FORMAT_EXPORT pod5_error_t
pod5_free_signal_row_info(size_t signal_rows_count, SignalRowInfo_t ** signal_row_info);

/// \brief Read the signal samples for a single signal row in a reader.
/// \param[in]  reader          The reader to query.
/// \param[in]  row_info        The signal row info batch index to query data for.
/// \param      sample_count    The number of samples allocated in [sample_data] (must equal the length of signal data in the row).
/// \param[out] sample_data     The output location for the queried samples.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The signal data is allocated by the caller and should be released as appropriate by the caller.
/// \note This returns only one row of a read's signal; use pod5_get_read_complete_signal for a whole read.
/// \todo MAJOR_VERSION Rename to include "chunk" or "row" or similar to indicate this gets only part of read signal.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_signal(
    Pod5FileReader_t const * reader,
    SignalRowInfo_t const * row_info,
    size_t sample_count,
    int16_t * sample_data);

/// \brief Find the sample count for a full read.
/// \param[in]  reader          The reader to query.
/// \param[in]  batch           The read batch to query.
/// \param      batch_row       The read row to query data for.
/// \param[out] sample_count    The number of samples in the read - including all chunks of raw data.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The count can be used to size the buffer passed to pod5_get_read_complete_signal.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_read_complete_sample_count(
    Pod5FileReader_t const * reader,
    Pod5ReadRecordBatch_t const * batch,
    size_t batch_row,
    size_t * sample_count);

/// \brief Find the signal for a full read.
/// \param[in]  reader          The reader to query.
/// \param[in]  batch           The read batch to query.
/// \param      batch_row       The read row to query data for.
/// \param      sample_count    The number of samples allocated in [signal] (must equal the length of signal data in the queried read row).
/// \param[out] signal          The output location for the queried samples.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The signal data is allocated by the caller and should be released as appropriate by the caller.
POD5_FORMAT_EXPORT pod5_error_t pod5_get_read_complete_signal(
    Pod5FileReader_t const * reader,
    Pod5ReadRecordBatch_t const * batch,
    size_t batch_row,
    size_t sample_count,
    int16_t * signal);

//---------------------------------------------------------------------------------------------------------------------
// Writing files
//---------------------------------------------------------------------------------------------------------------------

// Signal compression options, used for Pod5WriterOptions::signal_compression_type.
enum CompressionOption {
    /// \brief Use the default signal compression option.
    DEFAULT_SIGNAL_COMPRESSION = 0,
    /// \brief Use vbz to compress read signals in tables.
    VBZ_SIGNAL_COMPRESSION = 1,
    /// \brief Write signals uncompressed to tables.
    UNCOMPRESSED_SIGNAL = 2,
};

// Options to control how a file is written (passed to pod5_create_file).
// Every field has a documented "use the default" value: zero, or DEFAULT_SIGNAL_COMPRESSION.
struct Pod5WriterOptions {
    /// \brief Maximum number of samples to place in one signal record in the signals table.
    /// \note Use zero to use default value.
    uint32_t max_signal_chunk_size;
    /// \brief Signal type to write to the signals table (a CompressionOption value).
    /// \note Use 'DEFAULT_SIGNAL_COMPRESSION' to use default value.
    int8_t signal_compression_type;

    /// \brief The size of each batch written for the signal table (zero for default).
    size_t signal_table_batch_size;
    /// \brief The size of each batch written for the reads table (zero for default).
    size_t read_table_batch_size;
};
typedef struct Pod5WriterOptions Pod5WriterOptions_t;

/// \brief Create a new pod5 file using the specified filename and options.
/// \param filename         The filename of the pod5 file.
/// \param writer_name      A descriptive string for the user software writing this file.
/// \param options          Options controlling how the file will be written.
/// \return A writer, or null on error. The reason for the error can be queried with
///         pod5_get_error_no() and pod5_get_error_string().
/// \note A returned writer should be released with pod5_close_and_free_writer().
POD5_FORMAT_EXPORT Pod5FileWriter_t * pod5_create_file(
    char const * filename,
    char const * writer_name,
    Pod5WriterOptions_t const * options);

/// \brief Close a file writer, releasing all memory held by the writer.
/// \param file A previously opened writer.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note Any references to \a file or its components are no longer valid after this call.
/// \note It is safe to call this with a null \a file.
POD5_FORMAT_EXPORT pod5_error_t pod5_close_and_free_writer(Pod5FileWriter_t * file);

/// \brief Add a new pore type to the file.
/// \param[out] pore_index  The index of the added pore type.
/// \param      file        The file to add the new pore type to.
/// \param      pore_type   The pore type string for the pore.
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
/// \note The output parameter comes first in this function's argument list.
POD5_FORMAT_EXPORT pod5_error_t
pod5_add_pore(int16_t * pore_index, Pod5FileWriter_t * file, char const * pore_type);

/// \brief Add a new run info to the file, containing tracking information about a sequencing run.
/// \param[out] run_info_index              The index of the added run_info.
/// \param      file                        The file to add the new run info to.
/// \param      acquisition_id              The acquisition id for the run.
/// \param      acquisition_start_time_ms   Milliseconds after unix epoch when the acquisition was started.
/// \param      adc_max                     Maximum ADC value supported by this hardware.
/// \param      adc_min                     Minimum ADC value supported by this hardware.
/// \param      context_tags_count          Number of entries in the context tags map.
/// \param      context_tags_keys           Array of strings used as keys into the context tags map (must have context_tags_count entries).
/// \param      context_tags_values         Array of strings used as values in the context tags map (must have context_tags_count entries).
/// \param      experiment_name             Name given by the user to the group including this protocol.
/// \param      flow_cell_id                Id for the flow cell used in the run.
/// \param      flow_cell_product_code      Product code for the flow cell used in the run.
/// \param      protocol_name               Name given by the user to the protocol.
/// \param      protocol_run_id             Run id for the protocol.
/// \param      protocol_start_time_ms      Milliseconds after unix epoch when the protocol was started.
/// \param      sample_id                   Name given by the user for sample id.
/// \param      sample_rate                 Sample rate of the run.
/// \param      sequencing_kit              Sequencing kit used in the run.
/// \param      sequencer_position          Sequencer position used in the run.
/// \param      sequencer_position_type     Sequencer position type used in the run.
/// \param      software                    Name of the software used to produce the run.
/// \param      system_name                 Name of the system used to produce the run.
/// \param      system_type                 Type of the system used to produce the run.
/// \param      tracking_id_count           Number of entries in the tracking id map.
/// \param      tracking_id_keys            Array of strings used as keys into the tracking id map (must have tracking_id_count entries).
/// \param      tracking_id_values          Array of strings used as values in the tracking id map (must have tracking_id_count entries).
/// \return A pod5_error_t status code; see pod5_get_error_string() for details of a failure.
POD5_FORMAT_EXPORT pod5_error_t pod5_add_run_info(
    int16_t * run_info_index,
    Pod5FileWriter_t * file,
    char const * acquisition_id,
    int64_t acquisition_start_time_ms,
    int16_t adc_max,
    int16_t adc_min,
    size_t context_tags_count,
    char const ** context_tags_keys,
    char const ** context_tags_values,
    char const * experiment_name,
    char const * flow_cell_id,
    char const * flow_cell_product_code,
    char const * protocol_name,
    char const * protocol_run_id,
    int64_t protocol_start_time_ms,
    char const * sample_id,
    uint16_t sample_rate,
    char const * sequencing_kit,
    char const * sequencer_position,
    char const * sequencer_position_type,
    char const * software,
    char const * system_name,
    char const * system_type,
    size_t tracking_id_count,
    char const ** tracking_id_keys,
    char const ** tracking_id_values);

/// \brief Add one or more reads to the file.
///
/// For each read `r`, where `0 <= r < read_count`:
/// - `row_data->field[r]` describes a field of the read metadata
/// - `signal[r]` is the raw signal data for the read
/// - `signal_size[r]` is the length of `signal[r]` (in samples, not in bytes)
///
/// \param      file            The file to add the reads to.
/// \param      read_count      The number of reads to add with this call.
/// \param      struct_version  The version of the struct of [row_data] being filled, use READ_BATCH_ROW_INFO_VERSION.
/// \param      row_data        The array data for injecting into the file, should be ReadBatchRowInfoArray_t.
///                             All fields of the array must have length [read_count].
/// \param      signal          The signal data for the reads, one pointer to raw samples per read.
///                             This must be an array of length [read_count].
/// \param      signal_size     The number of samples in the signal data of each read.
///                             This must be an array of length [read_count].
/// \return     A pod5_error_t status code describing the outcome of the call.
POD5_FORMAT_EXPORT pod5_error_t pod5_add_reads_data(
    Pod5FileWriter_t * file,
    uint32_t read_count,
    uint16_t struct_version,
    void const * row_data,
    int16_t const ** signal,
    uint32_t const * signal_size);

/// \brief Add one or more reads to the file, with pre compressed signal chunk sections.
///
/// Consider using the simpler [pod5_add_reads_data] unless you have performance requirements that demand
/// more control over compression and chunking.
///
/// Data should be compressed using [pod5_vbz_compress_signal].
///
/// For each read `r`, where `0 <= r < read_count`:
/// - `row_data->field[r]` describes a field of the read metadata
/// - `signal_chunk_count[r]` is the number of signal chunks
/// - for each signal chunk `i` where `0 <= i < signal_chunk_count[r]`:
///   - `sample_counts[r][i]` is the number of samples in the chunk (ie: the size of the uncompressed data in
///     samples, not in bytes)
///   - `compressed_signal[r][i]` is the compressed data
///   - `compressed_signal_size[r][i]` is the length of the compressed data at `compressed_signal[r][i]`
///
/// \param      file                    The file to add the reads to.
/// \param      read_count              The number of reads to add with this call.
/// \param      struct_version          The version of the struct of [row_data] being filled, use READ_BATCH_ROW_INFO_VERSION.
/// \param      row_data                The array data for injecting into the file, should be ReadBatchRowInfoArray_t.
///                                     All fields of the array must have length [read_count].
/// \param      compressed_signal       The signal chunks data for the reads, indexed as `[r][i]` (read, then chunk).
/// \param      compressed_signal_size  The sizes (in bytes) of each signal chunk, indexed as `[r][i]`.
/// \param      sample_counts           The number of samples of each signal chunk, indexed as `[r][i]`. In other words, it is the
///                                     *uncompressed* size of the corresponding [compressed_signal] array, in samples (not bytes!).
/// \param      signal_chunk_count      The number of sections of compressed signal for each read.
///                                     This must be an array of length [read_count].
/// \return     A pod5_error_t status code describing the outcome of the call.
POD5_FORMAT_EXPORT pod5_error_t pod5_add_reads_data_pre_compressed(
    Pod5FileWriter_t * file,
    uint32_t read_count,
    uint16_t struct_version,
    void const * row_data,
    char const *** compressed_signal,
    size_t const ** compressed_signal_size,
    uint32_t const ** sample_counts,
    size_t const * signal_chunk_count);

/// \brief Find the max size of a compressed array of samples.
///
/// NOTE(review): presumably intended for sizing the output buffer handed to
/// [pod5_vbz_compress_signal] - confirm against the implementation.
///
/// \param sample_count The number of samples in the source signal.
/// \return The max number of bytes required for the compressed signal, or 0 on error.
///         The reason for the error can be queried with pod5_get_error_no() and
///         pod5_get_error_string().
POD5_FORMAT_EXPORT size_t pod5_vbz_compressed_signal_max_size(size_t sample_count);

/// \brief VBZ compress an array of samples.
/// \param          signal                      The signal to compress.
/// \param          signal_size                 The number of samples to compress.
/// \param[out]     compressed_signal_out       The compressed signal.
/// \param[in,out]  compressed_signal_size      On call: the size (in bytes) of the buffer at compressed_signal_out.
///                                             On return: the number of compressed bytes.
/// \return         A pod5_error_t status code describing the outcome of the call.
POD5_FORMAT_EXPORT pod5_error_t pod5_vbz_compress_signal(
    int16_t const * signal,
    size_t signal_size,
    char * compressed_signal_out,
    size_t * compressed_signal_size);

/// \brief VBZ decompress an array of samples.
/// \param          compressed_signal           The signal to decompress.
/// \param          compressed_signal_size      The number of compressed bytes, ie the size of compressed_signal in bytes.
/// \param          sample_count                The number of samples to decompress, ie the size of signal_out in samples.
/// \param[out]     signal_out                  The decompressed signal; must have room for sample_count samples.
/// \return         A pod5_error_t status code describing the outcome of the call.
POD5_FORMAT_EXPORT pod5_error_t pod5_vbz_decompress_signal(
    char const * compressed_signal,
    size_t compressed_signal_size,
    size_t sample_count,
    int16_t * signal_out);

//---------------------------------------------------------------------------------------------------------------------
// Global state
//---------------------------------------------------------------------------------------------------------------------

/// \brief Format a packed binary read id as a readable read id string.
/// \param          read_id           A 16 byte binary formatted UUID.
/// \param[out]     read_id_string    Output buffer receiving the string formatted UUID. The buffer must be at least
///                                   37 bytes long; the written string is terminated with one null byte.
/// \return         A pod5_error_t status code describing the outcome of the call.
POD5_FORMAT_EXPORT pod5_error_t pod5_format_read_id(read_id_t const read_id, char * read_id_string);

#ifdef __cplusplus
}
#endif


================================================
FILE: c++/pod5_format/dictionary_writer.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"

namespace arrow {
class Array;
}

namespace pod5 {

/// \brief Abstract base for writers that own the value side of a dictionary column.
///
/// Subclasses provide the dictionary values (get_value_array) and the number of
/// values currently held (item_count).
class POD5_FORMAT_EXPORT DictionaryWriter {
public:
    virtual ~DictionaryWriter() = default;

    /// \brief Build an array from a set of dictionary indices.
    /// \param indices The index array referring to entries of this dictionary.
    /// \note Defined out of line; presumably pairs [indices] with get_value_array() - confirm in the implementation.
    pod5::Result<std::shared_ptr<arrow::Array>> build_dictionary_array(
        std::shared_ptr<arrow::Array> const & indices);

    /// \brief Get the array of values stored in this dictionary.
    virtual pod5::Result<std::shared_ptr<arrow::Array>> get_value_array() = 0;

    /// \brief Get the number of items in this dictionary.
    virtual std::size_t item_count() = 0;

    /// \brief Check whether [value] is a usable index, ie strictly less than item_count().
    bool is_valid(std::size_t value) { return value < item_count(); }
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/expandable_buffer.h
================================================
#pragma once

#include <arrow/buffer.h>
#include <arrow/result.h>
#include <gsl/gsl-lite.hpp>

#include <cassert>

namespace pod5 {

/// \brief A growable buffer of `T` values stored as raw bytes in an arrow::ResizableBuffer.
///
/// The underlying buffer can be handed out with get_buffer(). While such a handle is still
/// alive elsewhere (use_count() > 1), clear() and reserve() switch to a freshly allocated
/// buffer rather than modifying the one that is shared.
///
/// Apart from size(), get_buffer(), get_data_span(), clear(), append(T) and append_array(),
/// the member functions require that a buffer has already been allocated (see init_buffer()).
template <typename T>
class ExpandableBuffer {
public:
    /// Multiplier applied to the requested capacity whenever the buffer has to grow.
    static constexpr int EXPANSION_FACTOR = 2;

    /// \brief Construct an empty buffer; no memory is allocated until init_buffer() or an append.
    /// \param pool The memory pool used for later allocations.
    ExpandableBuffer(arrow::MemoryPool * pool = nullptr) { m_pool = pool; }

    /// \brief Set the memory pool and make sure an empty buffer is allocated.
    arrow::Status init_buffer(arrow::MemoryPool * pool)
    {
        m_pool = pool;
        return clear();
    }

    /// \brief Number of whole `T` elements currently stored (0 if nothing is allocated).
    std::size_t size() const
    {
        if (!m_buffer) {
            return 0;
        }
        return m_buffer->size() / sizeof(T);
    }

    /// \brief Raw mutable access to the stored bytes. Requires an allocated buffer.
    std::uint8_t * mutable_data() { return m_buffer->mutable_data(); }

    /// \brief Share ownership of the underlying buffer (may be null if nothing is allocated).
    std::shared_ptr<arrow::Buffer> get_buffer() const { return m_buffer; }

    /// \brief Reset the buffer to zero length.
    ///
    /// Allocates a new empty buffer when none exists or when the current one is still
    /// referenced elsewhere; otherwise the existing buffer is resized to 0 without
    /// shrinking its capacity.
    arrow::Status clear()
    {
        if (!m_buffer || m_buffer.use_count() > 1) {
            ARROW_ASSIGN_OR_RAISE(m_buffer, arrow::AllocateResizableBuffer(0, m_pool));
            return arrow::Status::OK();
        } else {
            return m_buffer->Resize(0, false);
        }
    }

    /// \brief View the stored bytes as a read-only span of `T` (empty if nothing is allocated).
    gsl::span<T const> get_data_span() const
    {
        if (!m_buffer) {
            return {};
        }

        return gsl::make_span(m_buffer->data(), m_buffer->size()).template as_span<T const>();
    }

    /// \brief Append an object where you don't know the size up front.
    ///
    /// Requires an allocated buffer (see init_buffer()).
    ///
    /// \param max_size The maximum possible size (in bytes) of the object to append.
    /// \param append_fn A function that appends the object to the buffer. It is given a span of
    ///                  [max_size] writable bytes and returns the number of bytes actually written.
    template <typename Callable>
    arrow::Status append(std::size_t max_size, Callable append_fn)
    {
        assert(m_buffer);
        auto const old_size = m_buffer->size();
        ARROW_RETURN_NOT_OK(reserve(old_size + max_size));
        auto const potential_buffer = gsl::make_span(m_buffer->mutable_data() + old_size, max_size);
        ARROW_ASSIGN_OR_RAISE(auto final_size, append_fn(potential_buffer));
        // Exactly filling the reserved region is legal; only writing past it is an error.
        assert(final_size <= max_size);
        return resize(old_size + final_size);
    }

    /// \brief Append a single value, copying its bytes onto the end of the buffer.
    arrow::Status append(T const & new_value)
    {
        auto const bytes_span =
            gsl::make_span(&new_value, 1).template as_span<std::uint8_t const>();

        return append_bytes(bytes_span);
    }

    /// \brief Append a contiguous run of values, copying their bytes onto the end of the buffer.
    arrow::Status append_array(gsl::span<T const> const & new_value_span)
    {
        auto const bytes_span = new_value_span.template as_span<std::uint8_t const>();

        return append_bytes(bytes_span);
    }

    /// \brief Set the buffer length to [new_size] bytes, growing capacity first if needed.
    ///        Requires an allocated buffer.
    arrow::Status resize(std::int64_t new_size)
    {
        ARROW_RETURN_NOT_OK(reserve(new_size));
        return m_buffer->Resize(new_size, false);
    }

    /// \brief Make sure the buffer is exclusively owned and can hold [new_capacity] bytes.
    ///
    /// If the buffer is still referenced elsewhere its contents are first copied into a newly
    /// allocated buffer. When more room is required, EXPANSION_FACTOR times the requested
    /// capacity is reserved. Requires an allocated buffer.
    arrow::Status reserve(std::int64_t new_capacity)
    {
        assert(m_buffer);
        auto const old_size = m_buffer->size();
        if (m_buffer.use_count() > 1) {
            std::shared_ptr<arrow::ResizableBuffer> buffer;
            ARROW_ASSIGN_OR_RAISE(buffer, arrow::AllocateResizableBuffer(old_size, m_pool));

            std::copy(m_buffer->data(), m_buffer->data() + old_size, buffer->mutable_data());
            std::swap(m_buffer, buffer);
        }

        if (new_capacity > m_buffer->capacity()) {
            ARROW_RETURN_NOT_OK(m_buffer->Reserve(new_capacity * EXPANSION_FACTOR));
        }
        return arrow::Status::OK();
    }

private:
    /// \brief Copy [bytes_span] onto the end of the buffer, allocating the buffer on first use.
    arrow::Status append_bytes(gsl::span<std::uint8_t const> const & bytes_span)
    {
        // Kept as a 64-bit value to match arrow::Buffer::size(); a plain `int` here would
        // truncate the write offset once the buffer grows past 2 GiB.
        std::int64_t old_size = 0;
        if (!m_buffer) {
            ARROW_ASSIGN_OR_RAISE(
                m_buffer, arrow::AllocateResizableBuffer(bytes_span.size(), m_pool));
        } else {
            old_size = m_buffer->size();
        }
        std::int64_t const new_size = old_size + static_cast<std::int64_t>(bytes_span.size());
        ARROW_RETURN_NOT_OK(reserve(new_size));

        ARROW_RETURN_NOT_OK(m_buffer->Resize(new_size, false));
        std::copy(bytes_span.begin(), bytes_span.end(), m_buffer->mutable_data() + old_size);
        return arrow::Status::OK();
    }

    std::shared_ptr<arrow::ResizableBuffer> m_buffer;
    arrow::MemoryPool * m_pool = nullptr;
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_output_stream.h
================================================
#pragma once

#include <arrow/io/file.h>
#include <arrow/status.h>

namespace pod5 {

/// \brief An arrow output stream with two extra, optional hooks.
///
/// Both hooks have do-nothing defaults so subclasses only override what they need.
class FileOutputStream : public arrow::io::OutputStream {
public:
    /// \brief Hook for signalling that a batch is complete. The default does nothing and returns OK.
    virtual arrow::Status batch_complete() { return arrow::Status::OK(); }

    /// \brief Hook for supplying a file start offset. The default ignores [val].
    virtual void set_file_start_offset(std::size_t val) {}
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_reader.cpp
================================================
#include "pod5_format/file_reader.h"

#include "pod5_format/internal/combined_file_utils.h"
#include "pod5_format/memory_pool.h"
#include "pod5_format/migration/migration.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/run_info_table_reader.h"
#include "pod5_format/signal_table_reader.h"

#include <arrow/io/concurrency.h>
#include <arrow/io/file.h>
#include <arrow/ipc/reader.h>

#include <cstdint>
#include <iostream>
#if defined(__APPLE__) || defined(__linux__) || defined(__unix__)
#include <sys/stat.h>
#endif

namespace pod5 {

namespace {
#if defined(__APPLE__) || defined(__linux__) || defined(__unix__)
// Number of bytes represented by one unit of `st_blocks`.
constexpr std::uint64_t kStatBlockBytes = S_BLKSIZE;
// Only warn when the majority of the file is missing, to avoid false positives.
constexpr double kMinMissingFractionThreshold = 0.8;

/// \brief Print a warning to stderr when far fewer bytes are allocated for [path] than its
///        reported size.
///
/// Nothing is printed when stat() fails, when the file reports a non-positive size or a
/// negative block count, or when less than kMinMissingFractionThreshold of the reported size
/// is unallocated.
void warn_if_stat_size_and_blocks_differ_significantly(std::string const & path)
{
    struct stat info = {};
    bool const stat_succeeded = ::stat(path.c_str(), &info) == 0;
    if (!stat_succeeded || info.st_size <= 0 || info.st_blocks < 0) {
        return;
    }

    std::uint64_t const reported_bytes = static_cast<std::uint64_t>(info.st_size);
    std::uint64_t const resident_bytes =
        static_cast<std::uint64_t>(info.st_blocks) * kStatBlockBytes;

    // Fully allocated (or over-allocated) files are never suspicious.
    if (resident_bytes >= reported_bytes) {
        return;
    }

    double const absent_fraction = static_cast<double>(reported_bytes - resident_bytes)
                                   / static_cast<double>(reported_bytes);
    if (absent_fraction < kMinMissingFractionThreshold) {
        return;
    }

    std::cerr << "Warning: POD5 file '" << path << "' has st_size=" << reported_bytes
              << " bytes but only approximately " << resident_bytes
              << " bytes allocated via st_blocks. The file may be sparse or offloaded and "
                 "open/read operations may fail."
              << std::endl;
}
#else
void warn_if_stat_size_and_blocks_differ_significantly(std::string const &) {}
#endif
}  // namespace

// Default options: pod5's default memory pool and the default signal batch cache size.
FileReaderOptions::FileReaderOptions()
: m_memory_pool(pod5::default_memory_pool())
, m_max_cached_signal_table_batches(DEFAULT_MAX_CACHED_SIGNAL_TABLE_BATCHES)
{
}

// Store the maximum number of signal table batches that may be cached by a reader
// opened with these options.
void FileReaderOptions::set_max_cached_signal_table_batches(
    std::size_t max_cached_signal_table_batches)
{
    m_max_cached_signal_table_batches = max_cached_signal_table_batches;
}

// Convert the parsed footer entry for one embedded table into a FileLocation
// (file path, start offset and length).
inline FileLocation make_file_locaton(combined_file_utils::ParsedFileInfo const & parsed_file_info)
{
    auto const table_offset = static_cast<std::size_t>(parsed_file_info.file_start_offset);
    auto const table_length = static_cast<std::size_t>(parsed_file_info.file_length);
    return FileLocation(parsed_file_info.file_path, table_offset, table_length);
}

// Concrete FileReader backed by the three table readers of a POD5 file.
//
// Almost every member function forwards directly to the run info, read or signal table
// reader. The object also keeps the migration result and the location of each table
// as recorded in the (possibly migrated) footer.
class FileReaderImpl : public FileReader {
public:
    // Takes ownership of the migration result and of the three table readers.
    //
    // The table locations are computed from the m_migration_result member (not from the
    // moved-from constructor argument); this relies on m_migration_result being declared,
    // and therefore initialised, before the location members.
    FileReaderImpl(
        Version const & file_version_pre_migration,
        MigrationResult && migration_result,
        RunInfoTableReader && run_info_table_reader,
        ReadTableReader && read_table_reader,
        SignalTableReader && signal_table_reader)
    : m_file_version_pre_migration(file_version_pre_migration)
    , m_migration_result(std::move(migration_result))
    , m_run_info_table_location(make_file_locaton(m_migration_result.footer().run_info_table))
    , m_read_table_location(make_file_locaton(m_migration_result.footer().reads_table))
    , m_signal_table_location(make_file_locaton(m_migration_result.footer().signal_table))
    , m_run_info_table_reader(std::move(run_info_table_reader))
    , m_read_table_reader(std::move(read_table_reader))
    , m_signal_table_reader(std::move(signal_table_reader))
    {
    }

    // Schema metadata as stored on the read table.
    SchemaMetadataDescription schema_metadata() const override
    {
        return m_read_table_reader.schema_metadata();
    }

    // Number of rows in the run info table.
    Result<std::size_t> run_info_count() const override
    {
        return m_run_info_table_reader.CountRows();
    }

    // Total number of reads, derived from the first and last read batches only:
    // (batch_count - 1) * rows_in_first_batch + rows_in_last_batch.
    // NOTE(review): this assumes every batch except the last holds the same number of rows
    // as the first batch - confirm the writer guarantees that.
    virtual Result<std::size_t> read_count() const override
    {
        auto const batch_count = num_read_record_batches();
        if (batch_count == 0) {
            return 0;
        }

        ARROW_ASSIGN_OR_RAISE(auto const first_batch, read_read_record_batch(0));
        ARROW_ASSIGN_OR_RAISE(auto const last_batch, read_read_record_batch(batch_count - 1));

        return (batch_count - 1) * first_batch.num_rows() + last_batch.num_rows();
    }

    // Read batch [i] of the read table.
    Result<ReadTableRecordBatch> read_read_record_batch(std::size_t i) const override
    {
        return m_read_table_reader.read_record_batch(i);
    }

    // Number of record batches in the read table.
    std::size_t num_read_record_batches() const override
    {
        return m_read_table_reader.num_record_batches();
    }

    // Forwarded to the read table reader's read id search.
    Result<std::size_t> search_for_read_ids(
        ReadIdSearchInput const & search_input,
        gsl::span<uint32_t> const & batch_counts,
        gsl::span<uint32_t> const & batch_rows) const override
    {
        return m_read_table_reader.search_for_read_ids(search_input, batch_counts, batch_rows);
    }

    // Read batch [i] of the signal table.
    Result<SignalTableRecordBatch> read_signal_record_batch(std::size_t i) const override
    {
        return m_signal_table_reader.read_record_batch(i);
    }

    // Number of record batches in the signal table.
    std::size_t num_signal_record_batches() const override
    {
        return m_signal_table_reader.num_record_batches();
    }

    // Forwarded to the signal table reader's lookup of the batch holding signal row [row].
    Result<std::size_t> signal_batch_for_row_id(std::size_t row, std::size_t * batch_row)
        const override
    {
        return m_signal_table_reader.signal_batch_for_row_id(row, batch_row);
    }

    // Forwarded to the signal table reader.
    Result<std::size_t> extract_sample_count(
        gsl::span<std::uint64_t const> const & row_indices) const override
    {
        return m_signal_table_reader.extract_sample_count(row_indices);
    }

    // Forwarded to the signal table reader.
    Status extract_samples(
        gsl::span<std::uint64_t const> const & row_indices,
        gsl::span<std::int16_t> const & output_samples) const override
    {
        return m_signal_table_reader.extract_samples(row_indices, output_samples);
    }

    // Forwarded to the signal table reader.
    Result<std::vector<std::shared_ptr<arrow::Buffer>>> extract_samples_inplace(
        gsl::span<std::uint64_t const> const & row_indices,
        std::vector<std::uint32_t> & sample_count) const override
    {
        return m_signal_table_reader.extract_samples_inplace(row_indices, sample_count);
    }

    // Locations of the embedded tables, as captured from the footer at construction.
    FileLocation const & run_info_table_location() const override
    {
        return m_run_info_table_location;
    }

    FileLocation const & read_table_location() const override { return m_read_table_location; }

    FileLocation const & signal_table_location() const override { return m_signal_table_location; }

    // Writer version recorded in the file before any migration was applied.
    Version file_version_pre_migration() const override { return m_file_version_pre_migration; }

    // Signal type as reported by the signal table reader.
    SignalType signal_type() const override { return m_signal_table_reader.signal_type(); }

    // Look up run info by acquisition id.
    Result<std::shared_ptr<RunInfoData const>> find_run_info(
        std::string const & acquisition_id) const override
    {
        return m_run_info_table_reader.find_run_info(acquisition_id);
    }

    // Look up run info by index.
    Result<std::shared_ptr<RunInfoData const>> get_run_info(std::size_t index) const override
    {
        return m_run_info_table_reader.get_run_info(index);
    }

    // Run info count as reported by the run info table reader's get_run_info_count().
    // Note that run_info_count() above uses CountRows() instead.
    Result<std::size_t> get_run_info_count() const override
    {
        return m_run_info_table_reader.get_run_info_count();
    }

private:
    Version m_file_version_pre_migration;
    // Declared before the locations below: they are initialised from its footer.
    MigrationResult m_migration_result;
    FileLocation m_run_info_table_location;
    FileLocation m_read_table_location;
    FileLocation m_signal_table_location;
    RunInfoTableReader m_run_info_table_reader;
    ReadTableReader m_read_table_reader;
    SignalTableReader m_signal_table_reader;
};

// Open the POD5 file at [path] and build a FileReader for it.
//
// Steps, in order:
//  - reject options that carry no memory pool,
//  - warn on stderr if the file looks like a sparse/offloaded stub,
//  - read the footer through regular file I/O,
//  - switch to a memory mapped handle when mapping is allowed and succeeds,
//  - migrate the footer/tables if the writer version requires it,
//  - open the run info, reads and signal tables and check that the reads and signal
//    tables carry the same file identifier.
//
// Memory mapping is skipped when options.force_disable_file_mapping() is set or when the
// POD5_DISABLE_MMAP_OPEN environment variable is defined.
//
// Returns the reader, or the first error encountered.
pod5::Result<std::shared_ptr<FileReader>> open_file_reader(
    std::string const & path,
    FileReaderOptions const & options)
{
    auto pool = options.memory_pool();
    if (!pool) {
        // This is the reader entry point, so the message must not talk about a writer.
        return Status::Invalid("Invalid memory pool specified for file reader");
    }

    // Issue warning if the file appears to be a stub
    warn_if_stat_size_and_blocks_differ_significantly(path);

    // "Preflight" file reads are done via standard file I/O first to prevent SIGBUS errors
    // if the file is not resident (e.g. stub remains when file is archived).
    // If mmap succeeds afterwards, use it for normal table reads otherwise continue
    // using this preflight file handle.
    ARROW_ASSIGN_OR_RAISE(auto preflight_file, arrow::io::ReadableFile::Open(path, pool));
    ARROW_ASSIGN_OR_RAISE(
        auto original_footer_metadata, combined_file_utils::read_footer(path, preflight_file));

    std::shared_ptr<arrow::io::RandomAccessFile> file = preflight_file;
    if (!options.force_disable_file_mapping() && getenv("POD5_DISABLE_MMAP_OPEN") == nullptr) {
        auto file_opt = arrow::io::MemoryMappedFile::Open(path, arrow::io::FileMode::READ);
        if (file_opt.ok()) {
            file = *file_opt;
            // Downstream handles are extracted from the `footer.{table}.file`, update them
            // to use the mmap handle.
            combined_file_utils::bind_footer_file(original_footer_metadata, file);
        }
    }

    ARROW_ASSIGN_OR_RAISE(
        auto const original_writer_version,
        parse_version_number(original_footer_metadata.writer_pod5_version));
    ARROW_ASSIGN_OR_RAISE(
        auto migration_result,
        migrate_if_required(original_writer_version, original_footer_metadata, file, pool));

    // Each table was written as a standalone file, so it is opened as a sub file with an
    // offset: its reader can then seek around as if the table were a file of its own.

    ARROW_ASSIGN_OR_RAISE(
        auto run_info_sub_file, open_sub_file(migration_result.footer().run_info_table));
    ARROW_ASSIGN_OR_RAISE(
        auto run_info_table_reader, make_run_info_table_reader(run_info_sub_file, pool));

    ARROW_ASSIGN_OR_RAISE(
        auto reads_sub_file, open_sub_file(migration_result.footer().reads_table));
    ARROW_ASSIGN_OR_RAISE(auto read_table_reader, make_read_table_reader(reads_sub_file, pool));

    ARROW_ASSIGN_OR_RAISE(
        auto signal_sub_file, open_sub_file(migration_result.footer().signal_table));
    ARROW_ASSIGN_OR_RAISE(
        auto signal_table_reader,
        make_signal_table_reader(signal_sub_file, options.max_cached_signal_table_batches(), pool));

    // The reads and signal tables must belong to the same file.
    auto signal_metadata = signal_table_reader.schema_metadata();
    auto reads_metadata = read_table_reader.schema_metadata();
    if (signal_metadata.file_identifier != reads_metadata.file_identifier) {
        return Status::Invalid(
            "Invalid read and signal file pair signal identifier: ",
            signal_metadata.file_identifier,
            ", reads identifier: ",
            reads_metadata.file_identifier);
    }

    return std::make_shared<FileReaderImpl>(
        original_writer_version,
        std::move(migration_result),
        std::move(run_info_table_reader),
        std::move(read_table_reader),
        std::move(signal_table_reader));
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_reader.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/read_table_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/signal_table_utils.h"

#include <cstdint>
#include <memory>

namespace arrow {
class Array;
class Buffer;
class MemoryPool;
}  // namespace arrow

namespace pod5 {

class Version;
struct SchemaMetadataDescription;

/// \brief Options controlling how a POD5 file is opened for reading.
class POD5_FORMAT_EXPORT FileReaderOptions {
public:
    /// Default value for max_cached_signal_table_batches().
    static constexpr std::uint32_t DEFAULT_MAX_CACHED_SIGNAL_TABLE_BATCHES = 5;

    FileReaderOptions();

    /// \brief Set the memory pool used by the reader.
    void memory_pool(arrow::MemoryPool * memory_pool) { m_memory_pool = memory_pool; }

    /// \brief Get the memory pool used by the reader.
    arrow::MemoryPool * memory_pool() const { return m_memory_pool; }

    /// \brief Get how many signal table batches can be cached in memory.
    std::size_t max_cached_signal_table_batches() const
    {
        return m_max_cached_signal_table_batches;
    }

    /// \brief Set how many signal table batches can be cached in memory.
    /// \note 0 here implies no limit.
    void set_max_cached_signal_table_batches(std::size_t max_cached_signal_table_batches);

    /// \brief Set whether memory mapping of the file must not be used when opening it.
    void set_force_disable_file_mapping(bool force_disable_file_mapping)
    {
        m_force_disable_file_mapping = force_disable_file_mapping;
    }

    /// \brief Find whether memory mapping of the file has been forcibly disabled (default: false).
    bool force_disable_file_mapping() const { return m_force_disable_file_mapping; }

private:
    arrow::MemoryPool * m_memory_pool;
    std::size_t m_max_cached_signal_table_batches;
    bool m_force_disable_file_mapping = false;
};

/// \brief Describes a region of a file: the file's path, a start offset and a size.
class POD5_FORMAT_EXPORT FileLocation {
public:
    /// \param file_path_ Path of the file containing the region.
    /// \param offset_    Offset of the start of the region within the file.
    /// \param size_      Size of the region.
    FileLocation(std::string const & file_path_, std::size_t offset_, std::size_t size_)
    : file_path(file_path_)
    , offset(offset_)
    , size(size_)
    {
    }

    std::string file_path;
    std::size_t offset;
    std::size_t size;
};

class ReadTableRecordBatch;
class SignalTableRecordBatch;

/// \brief Abstract interface for reading a POD5 file.
///
/// Instances are obtained from open_file_reader().
class POD5_FORMAT_EXPORT FileReader {
public:
    virtual ~FileReader() = default;

    /// \brief Find the read schema metadata for this file.
    virtual SchemaMetadataDescription schema_metadata() const = 0;

    /// \brief Find the number of run info entries in the file.
    virtual Result<std::size_t> run_info_count() const = 0;
    /// \brief Find the number of reads in the file.
    virtual Result<std::size_t> read_count() const = 0;

    /// \brief Read record batch [i] of the read table.
    virtual Result<ReadTableRecordBatch> read_read_record_batch(std::size_t i) const = 0;
    /// \brief Find the number of record batches in the read table.
    virtual std::size_t num_read_record_batches() const = 0;

    /// \brief Search the read table for a set of read ids.
    /// \note The exact layout of [batch_counts] and [batch_rows] is defined by the
    ///       implementation; it is not visible from this header.
    virtual Result<std::size_t> search_for_read_ids(
        ReadIdSearchInput const & search_input,
        gsl::span<uint32_t> const & batch_counts,
        gsl::span<uint32_t> const & batch_rows) const = 0;

    /// \brief Read record batch [i] of the signal table.
    virtual Result<SignalTableRecordBatch> read_signal_record_batch(std::size_t i) const = 0;
    /// \brief Find the number of record batches in the signal table.
    virtual std::size_t num_signal_record_batches() const = 0;
    /// \brief Find the signal table batch for a signal row.
    /// \note [batch_row] is an output pointer; presumably it receives the row's index
    ///       within the returned batch - confirm against the implementation.
    virtual Result<std::size_t> signal_batch_for_row_id(std::size_t row, std::size_t * batch_row)
        const = 0;
    /// \brief Find the number of samples in a given list of rows.
    /// \param row_indices      The rows to query for sample count.
    /// \returns The sum of all sample counts on input rows.
    virtual Result<std::size_t> extract_sample_count(
        gsl::span<std::uint64_t const> const & row_indices) const = 0;

    /// \brief Extract the samples for a list of rows.
    /// \param row_indices      The rows to query for samples.
    /// \param output_samples   The output samples from the rows.
    virtual Status extract_samples(
        gsl::span<std::uint64_t const> const & row_indices,
        gsl::span<std::int16_t> const & output_samples) const = 0;

    /// \brief Extract the samples as written in the arrow table for a list of rows.
    /// \param row_indices      The rows to query for samples.
    /// \param sample_count     Output sample counts; presumably one entry per returned buffer
    ///                         (confirm against the implementation).
    /// \returns The buffers holding the signal data as stored in the table.
    virtual Result<std::vector<std::shared_ptr<arrow::Buffer>>> extract_samples_inplace(
        gsl::span<std::uint64_t const> const & row_indices,
        std::vector<std::uint32_t> & sample_count) const = 0;

    /// \brief Find the location of each embedded table.
    virtual FileLocation const & run_info_table_location() const = 0;
    virtual FileLocation const & read_table_location() const = 0;
    virtual FileLocation const & signal_table_location() const = 0;

    /// \brief Find the version the file had before any migration was applied on open.
    virtual Version file_version_pre_migration() const = 0;

    /// \brief Find the type of signal stored in the signal table.
    virtual SignalType signal_type() const = 0;

    /// \brief Find the run info with the given acquisition id.
    virtual Result<std::shared_ptr<RunInfoData const>> find_run_info(
        std::string const & acquisition_id) const = 0;

    /// \brief Get the run info at [index].
    virtual Result<std::shared_ptr<RunInfoData const>> get_run_info(std::size_t index) const = 0;
    /// \brief Get the number of run infos available through get_run_info().
    virtual Result<std::size_t> get_run_info_count() const = 0;
};

/// \brief Open a POD5 file for reading.
/// \param path     The path of the file to open.
/// \param options  Options controlling how the file is opened; defaults to a default-constructed FileReaderOptions.
/// \returns The opened reader, or an error status.
POD5_FORMAT_EXPORT pod5::Result<std::shared_ptr<FileReader>> open_file_reader(
    std::string const & path,
    FileReaderOptions const & options = {});

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_recovery.h
================================================
#pragma once

#include "pod5_format/internal/combined_file_utils.h"
#include "pod5_format/schema_metadata.h"

#include <arrow/buffer.h>
#include <arrow/io/file.h>
#include <arrow/ipc/reader.h>
#include <arrow/status.h>

#include <iostream>

namespace pod5 {

static constexpr char const * kArrowMagicBytes = "ARROW1";

/// \brief Summary of what recover_arrow_file() managed to read from a damaged file.
struct RecoveredData {
    // Metadata from the original file:
    SchemaMetadataDescription metadata;

    // Number of record batches read from the original file and handed to the destination:
    std::size_t recovered_batches = 0;
    // Error from the first batch that failed to load; left default-constructed if none failed:
    arrow::Status failed_batch_status;
    // Total number of rows across the recovered batches:
    std::size_t recovered_rows = 0;
};

/// \brief Copy every readable record batch from a (possibly truncated) Arrow file into
///        [destination_file].
///
/// The input must start with the Arrow magic bytes and its schema must equal the
/// destination's schema (schema metadata is not compared). Batches are read one by one
/// from the stream embedded in the file; reading stops at the end of the stream or at the
/// first batch that fails to load, in which case the failure is recorded in the result
/// rather than returned as an error.
///
/// \param file_to_recover   The file to recover batches from.
/// \param destination_file  Pointer-like handle to the writer receiving the batches; must
///                          provide `schema()` and `write_batch()`.
/// \returns The recovery summary, or an error if the file is not an Arrow file, the
///          schema does not match, or writing a batch fails.
template <typename DestFileType>
arrow::Result<RecoveredData> recover_arrow_file(
    std::shared_ptr<arrow::io::RandomAccessFile> const & file_to_recover,
    DestFileType const & destination_file)
{
    // The file must begin with the arrow magic bytes:
    int32_t const magic_size = static_cast<int>(::strlen(kArrowMagicBytes));
    ARROW_ASSIGN_OR_RAISE(auto header_bytes, file_to_recover->ReadAt(0, magic_size));
    bool const starts_with_magic = header_bytes->size() >= magic_size
                                   && memcmp(header_bytes->data(), kArrowMagicBytes, magic_size) == 0;
    if (!starts_with_magic) {
        return arrow::Status::Invalid("Not an Arrow file");
    }

    // The ipc file wraps a stream format section, open that directly:
    ARROW_ASSIGN_OR_RAISE(
        auto stream_section, combined_file_utils::open_sub_file(file_to_recover, 8));
    ARROW_ASSIGN_OR_RAISE(
        auto batch_reader, arrow::ipc::RecordBatchStreamReader::Open(stream_section));

    auto const & expected_schema = destination_file->schema();
    auto recovered_schema = batch_reader->schema();
    bool const schemas_match = recovered_schema->Equals(*expected_schema, false);
    if (!schemas_match) {
        return arrow::Status::Invalid(
            "Recovered file Schema does not match expected schema, version mismatch?");
    }

    RecoveredData outcome;
    ARROW_ASSIGN_OR_RAISE(
        outcome.metadata, read_schema_key_value_metadata(recovered_schema->metadata()));

    for (;;) {
        auto next_batch = batch_reader->Next();
        if (!next_batch.ok()) {
            // A batch that fails to load ends the recovery; keep what was read so far.
            outcome.failed_batch_status = next_batch.status();
            break;
        }

        auto & batch = *next_batch;
        if (!batch) {
            // A null batch marks the end of the stream.
            break;
        }

        outcome.recovered_batches += 1;
        outcome.recovered_rows += batch->num_rows();
        ARROW_RETURN_NOT_OK(destination_file->write_batch(*batch));
    }

    return outcome;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_updater.cpp
================================================
#include "pod5_format/file_updater.h"

#include "pod5_format/file_reader.h"
#include "pod5_format/internal/combined_file_utils.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/uuid.h"

#include <arrow/io/file.h>

namespace pod5 {

// Write a new combined file at [destination] from the tables of [source].
//
// The output consists of a header, then the signal, run info and reads tables (each
// copied from its location in the source and followed by the section marker), then a
// footer carrying the source's file identifier and writing software.
pod5::Status update_file(
    arrow::MemoryPool * pool,
    std::shared_ptr<FileReader> const & source,
    std::string destination)
{
    ARROW_ASSIGN_OR_RAISE(auto output, arrow::io::FileOutputStream::Open(destination, false));

    // A fresh random uuid separates the sections of the new file.
    std::random_device entropy;
    auto make_uuid = BasicUuidRandomGenerator<std::random_device>{entropy};
    auto const marker = make_uuid();

    auto source_metadata = source->schema_metadata();

    // Write the initial header to the combined file:
    ARROW_RETURN_NOT_OK(combined_file_utils::write_combined_header(output, marker));

    // Copies one table of the source into the output, leaving the source untouched.
    auto const copy_table = [&](FileLocation const & table_location) {
        return combined_file_utils::write_file_and_marker(
            pool,
            output,
            table_location,
            combined_file_utils::SubFileCleanup::LeaveOrignalFile,
            marker);
    };

    // Table order in the output: signal, run info, reads.
    ARROW_ASSIGN_OR_RAISE(auto signal_table_info, copy_table(source->signal_table_location()));
    ARROW_ASSIGN_OR_RAISE(
        auto run_info_table_info, copy_table(source->run_info_table_location()));
    ARROW_ASSIGN_OR_RAISE(auto reads_table_info, copy_table(source->read_table_location()));

    // Write full file footer:
    auto const footer_status = combined_file_utils::write_footer(
        output,
        marker,
        source_metadata.file_identifier,
        source_metadata.writing_software,
        signal_table_info,
        run_info_table_info,
        reads_table_info);
    ARROW_RETURN_NOT_OK(footer_status);

    return output->Close();
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_updater.h
================================================
#pragma once

#include "pod5_format/result.h"

#include <memory>

namespace arrow {
class MemoryPool;
}

namespace pod5 {

class FileReader;

/// \brief Write the path [destination] with any migrated data from [source].
/// \param pool The memory pool used while copying table data into the destination.
/// \param source The source file data to write updated.
/// \param destination The destination path to write the data to.
/// \returns OK on success, otherwise the first error encountered while writing.
/// \note The destination path should not be the same file that was opened for input.
pod5::Status update_file(
    arrow::MemoryPool * pool,
    std::shared_ptr<FileReader> const & source,
    std::string destination);

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_writer.cpp
================================================
#include "pod5_format/file_writer.h"

#include "pod5_format/file_recovery.h"
#include "pod5_format/internal/async_output_stream.h"
#include "pod5_format/internal/combined_file_utils.h"
#include "pod5_format/io_manager.h"
#include "pod5_format/memory_pool.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/read_table_writer.h"
#include "pod5_format/read_table_writer_utils.h"
#include "pod5_format/run_info_table_writer.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/signal_table_reader.h"
#include "pod5_format/signal_table_writer.h"
#include "pod5_format/thread_pool.h"
#include "pod5_format/uuid.h"
#include "pod5_format/version.h"

#include <arrow/io/file.h>
#include <arrow/result.h>
#include <arrow/util/future.h>
#include <arrow/util/key_value_metadata.h>

#include <filesystem>
#include <fstream>
#include <optional>

#ifdef __linux__
#include "pod5_format/internal/linux_output_stream.h"
#endif

namespace {
/// Lazily created IO helpers, shared between the streams opened for one file writer.
struct CachedFileValues {
    std::shared_ptr<pod5::IOManager> io_manager;
    std::shared_ptr<pod5::ThreadPool> thread_pool;
};

/// Lets a caller force flushing on batch completion regardless of the writer options.
enum class FlushMode { Default, ForceFlushOnBatchComplete };

/// Open an output stream for [path].
///
/// On Linux, when direct IO or sync IO is requested, a LinuxOutputStream is tried
/// first; if creating it fails, or on any other configuration, an AsyncOutputStream
/// is returned instead. The IO manager / thread pool is taken from [cached_values]
/// when already present, then from [options], and is created on demand otherwise.
arrow::Result<std::shared_ptr<pod5::FileOutputStream>> make_file_stream(
    std::string const & path,
    pod5::FileWriterOptions const & options,
    CachedFileValues & cached_values,
    bool keep_file_open,
    FlushMode flush_mode = FlushMode::Default)
{
    bool const flush_each_batch =
        flush_mode == FlushMode::ForceFlushOnBatchComplete || options.flush_on_batch_complete();

#ifdef __linux__
    bool const wants_linux_stream = options.use_directio() || options.use_sync_io();
    if (wants_linux_stream) {
        // Prefer a cached manager, then a user supplied one, then build a default.
        if (!cached_values.io_manager) {
            cached_values.io_manager = options.io_manager();
        }
        if (!cached_values.io_manager) {
            ARROW_ASSIGN_OR_RAISE(
                cached_values.io_manager, pod5::make_sync_io_manager(options.memory_pool()));
        }

        auto const linux_stream = pod5::LinuxOutputStream::make(
            path,
            cached_values.io_manager,
            options.write_chunk_size(),
            options.use_directio(),
            options.use_sync_io(),
            flush_each_batch,
            keep_file_open);

        // Direct IO may be unsupported for this path; a failure here is not fatal,
        // we simply continue below and build a regular AsyncOutputStream.
        if (linux_stream.ok()) {
            return linux_stream;
        }
    }

#endif
    // Prefer a cached pool, then a user supplied one, then a single threaded default.
    if (!cached_values.thread_pool) {
        cached_values.thread_pool = options.thread_pool();
    }
    if (!cached_values.thread_pool) {
        cached_values.thread_pool = pod5::make_thread_pool(1);
    }

    return pod5::AsyncOutputStream::make(
        path, cached_values.thread_pool, flush_each_batch, options.memory_pool(), keep_file_open);
}
}  // namespace

namespace pod5 {

/// Initialise every option to its DEFAULT_* constant, using the pod5 default memory pool.
FileWriterOptions::FileWriterOptions()
: m_max_signal_chunk_size(DEFAULT_SIGNAL_CHUNK_SIZE)
, m_memory_pool(pod5::default_memory_pool())
, m_signal_type(DEFAULT_SIGNAL_TYPE)
// Per-table batch sizes:
, m_signal_table_batch_size(DEFAULT_SIGNAL_TABLE_BATCH_SIZE)
, m_read_table_batch_size(DEFAULT_READ_TABLE_BATCH_SIZE)
, m_run_info_table_batch_size(DEFAULT_RUN_INFO_TABLE_BATCH_SIZE)
// Output stream behaviour:
, m_use_directio(DEFAULT_USE_DIRECTIO)
, m_write_chunk_size(DEFAULT_WRITE_CHUNK_SIZE)
, m_use_sync_io(DEFAULT_USE_SYNC_IO)
, m_flush_on_batch_complete(DEFAULT_FLUSH_ON_BATCH_COMPLETE)
// Whether each underlying file is kept open:
, m_keep_signal_file_open(DEFAULT_KEEP_FILES_OPEN)
, m_keep_run_info_file_open(DEFAULT_KEEP_FILES_OPEN)
, m_keep_read_table_file_open(DEFAULT_KEEP_FILES_OPEN)
{
}

/// \brief Shared implementation behind FileWriter.
///
/// Owns the run info, read and signal table writers together with the dictionary
/// writers used by the read table. Each table writer lives in an optional which is
/// reset once that writer has been closed; operations that need a closed writer
/// return an Invalid status rather than touching the empty optional.
class FileWriterImpl {
public:
    class WriterTypeImpl;

    /// Dictionary writers shared with the read table writer.
    struct DictionaryWriters {
        std::shared_ptr<EndReasonWriter> end_reason_writer;
        std::shared_ptr<PoreWriter> pore_writer;
        std::shared_ptr<RunInfoWriter> run_info_writer;
    };

    /// \param read_table_dict_writers Dictionary writers used to validate and index read fields.
    /// \param run_info_table_writer   Writer for the run info table.
    /// \param read_table_writer       Writer for the read table.
    /// \param signal_table_writer     Writer for the signal table.
    /// \param signal_chunk_size       Maximum number of samples stored per signal table row.
    /// \param pool                    Memory pool reported by pool().
    FileWriterImpl(
        DictionaryWriters && read_table_dict_writers,
        RunInfoTableWriter && run_info_table_writer,
        ReadTableWriter && read_table_writer,
        SignalTableWriter && signal_table_writer,
        std::uint32_t signal_chunk_size,
        arrow::MemoryPool * pool)
    : m_read_table_dict_writers(std::move(read_table_dict_writers))
    , m_run_info_table_writer(std::move(run_info_table_writer))
    , m_read_table_writer(std::move(read_table_writer))
    , m_signal_table_writer(std::move(signal_table_writer))
    , m_signal_chunk_size(signal_chunk_size)
    , m_pool(pool)
    {
    }

    virtual ~FileWriterImpl() = default;

    /// Path of the file being written.
    virtual std::string path() const = 0;

    /// Look up the dictionary index for [end_reason].
    pod5::Result<EndReasonDictionaryIndex> lookup_end_reason(ReadEndReason end_reason)
    {
        return m_read_table_dict_writers.end_reason_writer->lookup(end_reason);
    }

    /// Add a pore type to the pore dictionary, returning its index.
    pod5::Result<PoreDictionaryIndex> add_pore_type(std::string const & pore_type_data)
    {
        return m_read_table_dict_writers.pore_writer->add(pore_type_data);
    }

    /// Write [run_info_data] to the run info table and register its acquisition id
    /// in the run info dictionary.
    ///
    /// \returns The dictionary index of the run info, or Invalid if the run info
    ///          table writer has already been closed.
    pod5::Result<RunInfoDictionaryIndex> add_run_info(RunInfoData const & run_info_data)
    {
        // The optional is emptied by close_run_info_table_writer(); dereferencing it
        // while empty is undefined behaviour, so report the closed state instead.
        if (!m_run_info_table_writer) {
            return arrow::Status::Invalid("File writer closed, cannot write further data");
        }

        ARROW_RETURN_NOT_OK(m_run_info_table_writer->add_run_info(run_info_data));
        return m_read_table_dict_writers.run_info_writer->add(run_info_data.acquisition_id);
    }

    /// Write a read together with its raw signal: the signal is chunked into the
    /// signal table and the resulting rows are referenced from the new read table row.
    pod5::Status add_complete_read(
        ReadData const & read_data,
        gsl::span<std::int16_t const> const & signal)
    {
        if (!m_signal_table_writer || !m_read_table_writer) {
            return arrow::Status::Invalid("File writer closed, cannot write further data");
        }

        ARROW_RETURN_NOT_OK(check_read(read_data));

        ARROW_ASSIGN_OR_RAISE(
            std::vector<std::uint64_t> signal_rows, add_signal(read_data.read_id, signal));

        // Write read data and signal row entries:
        auto read_table_row = m_read_table_writer->add_read(
            read_data, gsl::make_span(signal_rows.data(), signal_rows.size()), signal.size());
        return read_table_row.status();
    }

    /// Write a read whose signal rows have already been added to the signal table.
    pod5::Status add_complete_read(
        ReadData const & read_data,
        gsl::span<std::uint64_t const> const & signal_rows,
        std::uint64_t signal_duration)
    {
        if (!m_signal_table_writer || !m_read_table_writer) {
            return arrow::Status::Invalid("File writer closed, cannot write further data");
        }

        ARROW_RETURN_NOT_OK(check_read(read_data));

        // Write read data and signal row entries:
        auto read_table_row =
            m_read_table_writer->add_read(read_data, signal_rows, signal_duration);
        return read_table_row.status();
    }

    /// Check that the dictionary indices carried by [read_data] are known to the
    /// dictionary writers.
    arrow::Status check_read(ReadData const & read_data)
    {
        if (!m_read_table_dict_writers.run_info_writer->is_valid(read_data.run_info)) {
            return arrow::Status::Invalid("Invalid run info passed to add_read");
        }

        if (!m_read_table_dict_writers.pore_writer->is_valid(read_data.pore_type)) {
            return arrow::Status::Invalid("Invalid pore type passed to add_read");
        }

        if (!m_read_table_dict_writers.end_reason_writer->is_valid(read_data.end_reason)) {
            return arrow::Status::Invalid("Invalid end reason passed to add_read");
        }

        return arrow::Status::OK();
    }

    /// Split [signal] into chunks of at most the configured chunk size and add each
    /// chunk to the signal table.
    ///
    /// \returns The signal table row index of every chunk, in order. Invalid is
    ///          returned if the writer is closed or the chunk size is zero.
    pod5::Result<std::vector<SignalTableRowIndex>> add_signal(
        Uuid const & read_id,
        gsl::span<std::int16_t const> const & signal)
    {
        if (!m_signal_table_writer || !m_read_table_writer) {
            return arrow::Status::Invalid("File writer closed, cannot write further data");
        }

        // A zero chunk size would divide by zero below and never advance the loop.
        if (m_signal_chunk_size == 0) {
            return arrow::Status::Invalid("Signal chunk size must be greater than zero");
        }

        std::vector<SignalTableRowIndex> signal_rows;
        signal_rows.reserve((signal.size() / m_signal_chunk_size) + 1);

        // Chunk and write each piece of signal to the file:
        for (std::size_t chunk_start = 0; chunk_start < signal.size();
             chunk_start += m_signal_chunk_size)
        {
            std::size_t chunk_size =
                std::min<std::size_t>(signal.size() - chunk_start, m_signal_chunk_size);

            auto const chunk_span = signal.subspan(chunk_start, chunk_size);

            ARROW_ASSIGN_OR_RAISE(
                auto row_index, m_signal_table_writer->add_signal(read_id, chunk_span));
            signal_rows.push_back(row_index);
        }
        return signal_rows;
    }

    /// Add one row of already compressed signal bytes to the signal table.
    pod5::Result<SignalTableRowIndex> add_pre_compressed_signal(
        Uuid const & read_id,
        gsl::span<std::uint8_t const> const & signal_bytes,
        std::uint32_t sample_count)
    {
        if (!m_signal_table_writer || !m_read_table_writer) {
            return arrow::Status::Invalid("File writer closed, cannot write further data");
        }

        return m_signal_table_writer->add_pre_compressed_signal(
            read_id, signal_bytes, sample_count);
    }

    /// Forward a prepared batch of signal columns to the signal table writer.
    pod5::Result<std::pair<SignalTableRowIndex, SignalTableRowIndex>> add_signal_batch(
        std::size_t row_count,
        std::vector<std::shared_ptr<arrow::Array>> && columns,
        bool final_batch)
    {
        if (!m_signal_table_writer || !m_read_table_writer) {
            return arrow::Status::Invalid("File writer closed, cannot write further data");
        }

        return m_signal_table_writer->add_signal_batch(row_count, std::move(columns), final_batch);
    }

    // NOTE: the two accessors below dereference the signal table writer directly,
    // so they must not be called once the writer has been closed.
    SignalType signal_type() const { return m_signal_table_writer->signal_type(); }

    std::size_t signal_table_batch_size() const
    {
        return m_signal_table_writer->table_batch_size();
    }

    /// Close the run info table writer if it is still open; a no-op otherwise.
    pod5::Status close_run_info_table_writer()
    {
        if (m_run_info_table_writer) {
            ARROW_RETURN_NOT_OK(m_run_info_table_writer->close());
            m_run_info_table_writer = std::nullopt;
        }
        return pod5::Status::OK();
    }

    /// Close the read table writer if it is still open; a no-op otherwise.
    pod5::Status close_read_table_writer()
    {
        if (m_read_table_writer) {
            ARROW_RETURN_NOT_OK(m_read_table_writer->close());
            m_read_table_writer = std::nullopt;
        }
        return pod5::Status::OK();
    }

    /// Close the signal table writer if it is still open; a no-op otherwise.
    pod5::Status close_signal_table_writer()
    {
        if (m_signal_table_writer) {
            ARROW_RETURN_NOT_OK(m_signal_table_writer->close());
            m_signal_table_writer = std::nullopt;
        }
        return pod5::Status::OK();
    }

    /// Finalise the file; implemented by the concrete writer.
    virtual arrow::Status close() = 0;

    /// True once the signal table writer has been closed.
    bool is_closed() const
    {
        assert(!!m_read_table_writer == !!m_signal_table_writer);
        return !m_signal_table_writer;
    }

    arrow::MemoryPool * pool() const { return m_pool; }

    /// \returns The run info table writer, or nullptr when the file or that writer is closed.
    RunInfoTableWriter * run_info_table_writer()
    {
        if (is_closed() || !m_run_info_table_writer.has_value()) {
            return nullptr;
        }
        return &m_run_info_table_writer.value();
    }

    /// \returns The read table writer, or nullptr when the file or that writer is closed.
    ReadTableWriter * read_table_writer()
    {
        if (is_closed() || !m_read_table_writer.has_value()) {
            return nullptr;
        }
        return &m_read_table_writer.value();
    }

    /// \returns The signal table writer, or nullptr when it is closed.
    SignalTableWriter * signal_table_writer()
    {
        if (is_closed() || !m_signal_table_writer.has_value()) {
            return nullptr;
        }
        return &m_signal_table_writer.value();
    }

private:
    DictionaryWriters m_read_table_dict_writers;
    std::optional<RunInfoTableWriter> m_run_info_table_writer;
    std::optional<ReadTableWriter> m_read_table_writer;
    std::optional<SignalTableWriter> m_signal_table_writer;
    std::uint32_t m_signal_chunk_size;
    arrow::MemoryPool * m_pool;
};

/// \brief Writer producing a single combined file.
///
/// While writing, the signal table is streamed straight into the main file at
/// [path] and the run info and read tables go to temporary files. close() appends
/// those temporary files to the main file, removes them and writes the footer.
class CombinedFileWriterImpl : public FileWriterImpl {
public:
    /// \param path                     Path of the combined output file.
    /// \param run_info_tmp_path        Temporary file holding the run info table.
    /// \param reads_tmp_path           Temporary file holding the read table.
    /// \param signal_file_start_offset Offset in [path] at which the signal table begins.
    /// \param section_marker           Marker written between sections of the file.
    /// \param file_identifier          Identifier recorded in the footer.
    /// \param software_name            Writing software name recorded in the footer.
    /// The remaining arguments are forwarded to FileWriterImpl.
    CombinedFileWriterImpl(
        std::string const & path,
        std::string const & run_info_tmp_path,
        std::string const & reads_tmp_path,
        std::int64_t signal_file_start_offset,
        Uuid const & section_marker,
        Uuid const & file_identifier,
        std::string const & software_name,
        DictionaryWriters && dict_writers,
        RunInfoTableWriter && run_info_table_writer,
        ReadTableWriter && read_table_writer,
        SignalTableWriter && signal_table_writer,
        std::uint32_t signal_chunk_size,
        arrow::MemoryPool * pool)
    : FileWriterImpl(
          std::move(dict_writers),
          std::move(run_info_table_writer),
          std::move(read_table_writer),
          std::move(signal_table_writer),
          signal_chunk_size,
          pool)
    , m_path(path)
    , m_run_info_tmp_path(run_info_tmp_path)
    , m_reads_tmp_path(reads_tmp_path)
    , m_signal_file_start_offset(signal_file_start_offset)
    , m_section_marker(section_marker)
    , m_file_identifier(file_identifier)
    , m_software_name(software_name)
    {
    }

    std::string path() const override { return m_path; }

    /// Close all table writers, append the temporary tables and the footer to the
    /// main file, then close the main file.
    ///
    /// Calling close() on an already closed writer is a no-op returning OK.
    /// \returns The first error hit while finalising, including any error reported
    ///          when the output stream itself is closed.
    arrow::Status close() override
    {
        if (is_closed()) {
            return arrow::Status::OK();
        }
        ARROW_RETURN_NOT_OK(close_run_info_table_writer());
        ARROW_RETURN_NOT_OK(close_read_table_writer());
        ARROW_RETURN_NOT_OK(close_signal_table_writer());

        // Open main path with append set:
        ARROW_ASSIGN_OR_RAISE(auto file, arrow::io::FileOutputStream::Open(m_path, true));

        // Record signal table length: everything between the recorded start offset
        // and the current position of the appended stream.
        combined_file_utils::FileInfo signal_table;
        signal_table.file_start_offset = m_signal_file_start_offset;
        ARROW_ASSIGN_OR_RAISE(signal_table.file_length, file->Tell());
        signal_table.file_length -= signal_table.file_start_offset;

        // pad file to 8 bytes and mark section:
        ARROW_RETURN_NOT_OK(combined_file_utils::pad_file(file, 8));
        ARROW_RETURN_NOT_OK(combined_file_utils::write_section_marker(file, m_section_marker));

        // Describes a whole temporary file (offset 0, full size) as a FileLocation.
        auto file_location_for_full_file =
            [&](std::string const & filename) -> arrow::Result<FileLocation> {
            ARROW_ASSIGN_OR_RAISE(
                auto tmp_file, arrow::io::ReadableFile::Open(filename, pool()));
            ARROW_ASSIGN_OR_RAISE(auto size, tmp_file->GetSize());
            return FileLocation{filename, 0, std::size_t(size)};
        };

        // Write in run_info table:
        ARROW_ASSIGN_OR_RAISE(
            auto run_info_location, file_location_for_full_file(m_run_info_tmp_path));
        ARROW_ASSIGN_OR_RAISE(
            auto run_info_info_table,
            combined_file_utils::write_file_and_marker(
                pool(),
                file,
                run_info_location,
                combined_file_utils::SubFileCleanup::CleanupOriginalFile,
                m_section_marker));

        // Write in read table:
        ARROW_ASSIGN_OR_RAISE(auto reads_location, file_location_for_full_file(m_reads_tmp_path));
        ARROW_ASSIGN_OR_RAISE(
            auto reads_info_table,
            combined_file_utils::write_file_and_marker(
                pool(),
                file,
                reads_location,
                combined_file_utils::SubFileCleanup::CleanupOriginalFile,
                m_section_marker));

        // Write full file footer:
        ARROW_RETURN_NOT_OK(
            combined_file_utils::write_footer(
                file,
                m_section_marker,
                m_file_identifier,
                m_software_name,
                signal_table,
                run_info_info_table,
                reads_info_table));

        // Close explicitly so that a failure to flush/close the stream is reported
        // to the caller rather than being discarded by the stream's destructor.
        return file->Close();
    }

private:
    std::string m_path;
    std::string m_run_info_tmp_path;
    std::string m_reads_tmp_path;
    std::int64_t m_signal_file_start_offset;
    Uuid m_section_marker;
    Uuid m_file_identifier;
    std::string m_software_name;
};

// FileWriter is a thin facade: every member below forwards to the owned
// FileWriterImpl instance.

/// Take ownership of the implementation object.
FileWriter::FileWriter(std::unique_ptr<FileWriterImpl> && impl) : m_impl(std::move(impl)) {}

/// Closes the writer on destruction; the status returned by close() is
/// deliberately discarded because a destructor has no way to report it.
FileWriter::~FileWriter() { (void)close(); }

/// Path reported by the implementation.
std::string FileWriter::path() const { return m_impl->path(); }

/// Finalise the file by delegating to the implementation's close().
arrow::Status FileWriter::close() { return m_impl->close(); }

/// Add a read together with its raw signal samples.
arrow::Status FileWriter::add_complete_read(
    ReadData const & read_data,
    gsl::span<std::int16_t const> const & signal)
{
    return m_impl->add_complete_read(read_data, signal);
}

/// Add a read that refers to signal table rows which were written previously.
arrow::Status FileWriter::add_complete_read(
    ReadData const & read_data,
    gsl::span<std::uint64_t const> const & signal_rows,
    std::uint64_t signal_duration)
{
    return m_impl->add_complete_read(read_data, signal_rows, signal_duration);
}

/// Add raw signal for [read_id]; returns the signal table rows that were written.
pod5::Result<std::vector<SignalTableRowIndex>> FileWriter::add_signal(
    Uuid const & read_id,
    gsl::span<std::int16_t const> const & signal)
{
    return m_impl->add_signal(read_id, signal);
}

/// Add a single row of already compressed signal bytes for [read_id].
pod5::Result<SignalTableRowIndex> FileWriter::add_pre_compressed_signal(
    Uuid const & read_id,
    gsl::span<std::uint8_t const> const & signal_bytes,
    std::uint32_t sample_count)
{
    return m_impl->add_pre_compressed_signal(read_id, signal_bytes, sample_count);
}

/// Add a prepared batch of signal table columns; [columns] is moved into the implementation.
pod5::Result<std::pair<SignalTableRowIndex, SignalTableRowIndex>> FileWriter::add_signal_batch(
    std::size_t row_count,
    std::vector<std::shared_ptr<arrow::Array>> && columns,
    bool final_batch)
{
    return m_impl->add_signal_batch(row_count, std::move(columns), final_batch);
}

/// Look up the dictionary index for an end reason.
pod5::Result<EndReasonDictionaryIndex> FileWriter::lookup_end_reason(ReadEndReason end_reason) const
{
    return m_impl->lookup_end_reason(end_reason);
}

/// Add a pore type, returning its dictionary index.
pod5::Result<PoreDictionaryIndex> FileWriter::add_pore_type(std::string const & pore_type_data)
{
    return m_impl->add_pore_type(pore_type_data);
}

/// Add run info, returning its dictionary index.
pod5::Result<RunInfoDictionaryIndex> FileWriter::add_run_info(RunInfoData const & run_info_data)
{
    return m_impl->add_run_info(run_info_data);
}

/// Signal type reported by the signal table writer.
SignalType FileWriter::signal_type() const { return m_impl->signal_type(); }

/// Batch size reported by the signal table writer.
std::size_t FileWriter::signal_table_batch_size() const
{
    return m_impl->signal_table_batch_size();
}

/// Create the end reason, pore and run info dictionary writers (in that order),
/// all allocating from [pool]. The first failure is returned to the caller.
pod5::Result<FileWriterImpl::DictionaryWriters> make_dictionary_writers(arrow::MemoryPool * pool)
{
    FileWriterImpl::DictionaryWriters dictionaries;

    ARROW_ASSIGN_OR_RAISE(dictionaries.end_reason_writer, pod5::make_end_reason_writer(pool));

    ARROW_ASSIGN_OR_RAISE(dictionaries.pore_writer, pod5::make_pore_writer(pool));

    ARROW_ASSIGN_OR_RAISE(dictionaries.run_info_writer, pod5::make_run_info_writer(pool));

    return dictionaries;
}

/// Build the temporary read table path: a dot-prefixed file named after
/// [file_identifier] with a ".tmp-reads" suffix, in the parent directory of [arrow_path].
std::string make_reads_tmp_path(
    ::arrow::internal::PlatformFilename const & arrow_path,
    Uuid const & file_identifier)
{
    std::string const hidden_file_name = "." + to_string(file_identifier) + ".tmp-reads";
    return arrow_path.Parent().ToString() + "/" + hidden_file_name;
}

/// Build the temporary run info table path: a dot-prefixed file named after
/// [file_identifier] with a ".tmp-run-info" suffix, in the parent directory of [arrow_path].
std::string make_run_info_tmp_path(
    ::arrow::internal::PlatformFilename const & arrow_path,
    Uuid const & file_identifier)
{
    std::string const hidden_file_name = "." + to_string(file_identifier) + ".tmp-run-info";
    return arrow_path.Parent().ToString() + "/" + hidden_file_name;
}

/// \brief Create a writer for a new combined file at [path].
///
/// The signal table is written directly into [path] after the combined header,
/// while the read and run info tables are written to temporary files placed next
/// to [path] and named after the newly generated file identifier.
///
/// \param path                  Path of the file to create; it must not already exist.
/// \param writing_software_name Software name stored in the schema metadata and passed to the
///                              writer.
/// \param options               Writer options (memory pool, batch sizes, IO behaviour).
/// \returns The new writer, or Invalid if the memory pool is null or the file already
///          exists, or any error raised while opening the underlying streams and writers.
pod5::Result<std::unique_ptr<FileWriter>> create_file_writer(
    std::string const & path,
    std::string const & writing_software_name,
    FileWriterOptions const & options)
{
    auto pool = options.memory_pool();
    if (!pool) {
        return Status::Invalid("Invalid memory pool specified for file writer");
    }

    // Refuse to write over an existing file.
    ARROW_ASSIGN_OR_RAISE(auto arrow_path, ::arrow::internal::PlatformFilename::FromString(path));
    ARROW_ASSIGN_OR_RAISE(bool file_exists, arrow::internal::FileExists(arrow_path));
    if (file_exists) {
        return Status::Invalid("Unable to create new file '", path, "', already exists");
    }

    // Open dictionary writers:
    ARROW_ASSIGN_OR_RAISE(auto dict_writers, make_dictionary_writers(pool));

    // Prep file metadata:
    std::random_device gen;
    auto uuid_gen = BasicUuidRandomGenerator<std::random_device>{gen};
    auto const section_marker = uuid_gen();
    auto const file_identifier = uuid_gen();

    ARROW_ASSIGN_OR_RAISE(auto current_version, parse_version_number(Pod5Version));
    ARROW_ASSIGN_OR_RAISE(
        auto file_schema_metadata,
        make_schema_key_value_metadata({file_identifier, writing_software_name, current_version}));

    // Temporary file names are derived from the file identifier.
    auto reads_tmp_path = make_reads_tmp_path(arrow_path, file_identifier);
    auto run_info_tmp_path = make_run_info_tmp_path(arrow_path, file_identifier);

    // Shared between the three make_file_stream calls below so that the IO manager
    // / thread pool is only set up once.
    CachedFileValues cached_values;

    // Prepare the temporary reads file:
    ARROW_ASSIGN_OR_RAISE(
        auto read_table_file_async,
        make_file_stream(
            reads_tmp_path, options, cached_values, options.keep_read_table_file_open()));
    ARROW_ASSIGN_OR_RAISE(
        auto read_table_tmp_writer,
        make_read_table_writer(
            read_table_file_async,
            file_schema_metadata,
            options.read_table_batch_size(),
            dict_writers.pore_writer,
            dict_writers.end_reason_writer,
            dict_writers.run_info_writer,
            pool));

    // Prepare the temporary run_info file:
    //
    // Run info is normally global, if we don't flush on batch complete we can
    // lose a large number of reads in a crash.
    ARROW_ASSIGN_OR_RAISE(
        auto run_info_table_file_async,
        make_file_stream(
            run_info_tmp_path,
            options,
            cached_values,
            options.keep_run_info_file_open(),
            FlushMode::ForceFlushOnBatchComplete));

    ARROW_ASSIGN_OR_RAISE(
        auto run_info_table_tmp_writer,
        make_run_info_table_writer(
            run_info_table_file_async,
            file_schema_metadata,
            options.run_info_table_batch_size(),
            pool));

    // Prepare the main file - and set up the signal table to write here:
    ARROW_ASSIGN_OR_RAISE(
        auto signal_file,
        make_file_stream(path, options, cached_values, options.keep_signal_file_open()));

    // Write the initial header to the combined file:
    ARROW_RETURN_NOT_OK(combined_file_utils::write_combined_header(signal_file, section_marker));

    // The signal table starts wherever the stream is positioned after the header.
    ARROW_ASSIGN_OR_RAISE(size_t const signal_table_start, signal_file->Tell());

    // NOTE(review): make_file_stream may return a LinuxOutputStream on Linux when
    // direct/sync IO is enabled, yet this cast is unchecked and assumes an
    // AsyncOutputStream - confirm the stream class hierarchy makes this valid.
    static_cast<AsyncOutputStream *>(signal_file.get())->set_file_start_offset(signal_table_start);

    // Then place the signal file directly after that:
    ARROW_ASSIGN_OR_RAISE(
        auto signal_table_writer,
        make_signal_table_writer(
            signal_file,
            file_schema_metadata,
            options.signal_table_batch_size(),
            options.signal_type(),
            pool));

    // Throw it all together into a writer object:
    return std::make_unique<FileWriter>(std::make_unique<CombinedFileWriterImpl>(
        path,
        run_info_tmp_path,
        reads_tmp_path,
        signal_table_start,
        section_marker,
        file_identifier,
        writing_software_name,
        std::move(dict_writers),
        std::move(run_info_table_tmp_writer),
        std::move(read_table_tmp_writer),
        std::move(signal_table_writer),
        options.max_signal_chunk_size(),
        pool));
}

/// Wrap a failed [status] with a message naming what was being recovered and from
/// which file.
///
/// When the status carries a detail object the message is replaced by the context
/// (the detail is kept by WithMessage); otherwise a new status with the same code
/// is built whose message is the context followed by the original message.
static Status add_recovery_failure_context(
    Status status,
    std::string const & tmp_path,
    std::string const & description)
{
    assert(!status.ok());

    std::string error_context = "Failed whilst attempting to recover ";
    error_context += description;
    error_context += " from file - ";
    error_context += tmp_path;

    if (!status.detail()) {
        return arrow::Status::FromArgs(
            status.code(), error_context + ". Detail: " + status.message());
    }
    return status.WithMessage(error_context);
}

/// Recover the arrow data stored in the temporary file [tmp_path] into
/// [destination_writer].
///
/// An empty file is reported as Invalid. Any failure is returned with recovery
/// context naming [description] and [tmp_path].
template <typename writer_type>
static Status append_recovered_file(
    std::string const & tmp_path,
    writer_type const & destination_writer,
    std::string const & description,
    arrow::MemoryPool * const pool)
{
    auto const recover = [&]() -> arrow::Status {
        ARROW_ASSIGN_OR_RAISE(auto tmp_file, arrow::io::ReadableFile::Open(tmp_path, pool));
        ARROW_ASSIGN_OR_RAISE(auto byte_count, tmp_file->GetSize());
        if (byte_count == 0) {
            return arrow::Status::Invalid("File is empty/zero bytes long.");
        }
        // Only success or failure matters here; the recovered data itself is not used.
        ARROW_RETURN_NOT_OK(recover_arrow_file(tmp_file, destination_writer).status());
        return arrow::Status::OK();
    };

    arrow::Status const outcome = recover();
    if (outcome.ok()) {
        return outcome;
    }
    return add_recovery_failure_context(outcome, tmp_path, description);
}

namespace {
/// Paths of the temporary table files that belong to a file being recovered.
/// The fields are filled in during recovery and read afterwards for cleanup.
struct TemporaryFilePaths {
    // Temporary file holding the run info table.
    std::string run_info;
    // Temporary file holding the read table.
    std::string reads;
};
}  // namespace

/// \brief Recover the contents of an unfinished file at [src_path] into a new file
/// at [dest_path].
///
/// The signal table is read from the source file itself (directly after the
/// combined header); the run info and read tables are read from the temporary
/// files whose names are derived from the file identifier found in the recovered
/// signal metadata.
///
/// \param src_path             Path of the file to recover.
/// \param dest_path            Path of the new file to write the recovered data to.
/// \param options              Options used when creating the destination writer.
/// \param temporary_file_paths Out: set to the temporary file paths once the file
///                             identifier is known. Left untouched if recovery fails
///                             before that point.
/// \returns OK on success, otherwise the first failure (with recovery context where available).
static pod5::Status recover_file(
    std::string const & src_path,
    std::string const & dest_path,
    FileWriterOptions const & options,
    TemporaryFilePaths & temporary_file_paths)
{
    if (!check_extension_types_registered()) {
        return arrow::Status::Invalid("POD5 library is not correctly initialised.");
    }

    // Create a file to push recovered data into:
    ARROW_ASSIGN_OR_RAISE(
        auto dest_file, create_file_writer(dest_path, "pod5_file_recovery", options));

    // NOTE(review): reading uses arrow's default pool rather than
    // options.memory_pool() - confirm this is intended.
    auto pool = arrow::default_memory_pool();
    ARROW_ASSIGN_OR_RAISE(
        auto arrow_path, ::arrow::internal::PlatformFilename::FromString(src_path));
    ARROW_ASSIGN_OR_RAISE(auto file, arrow::io::ReadableFile::Open(src_path, pool));

    // Signature should be right at 0:
    ARROW_RETURN_NOT_OK(combined_file_utils::check_signature(file, 0));

    // Recover the signal data into [dest_file]:
    arrow::Result<RecoveredData> recovered_raw_data;
    {
        // The signal sub file starts immediately after the combined header.
        ARROW_ASSIGN_OR_RAISE(
            auto raw_sub_file,
            combined_file_utils::open_sub_file(file, combined_file_utils::header_size));
        recovered_raw_data =
            recover_arrow_file(raw_sub_file, dest_file->impl()->signal_table_writer());
    }
    if (!recovered_raw_data.ok()) {
        return add_recovery_failure_context(
            recovered_raw_data.status(), arrow_path.ToString(), "signal data sub file");
    }

    // The temporary table files are named after the identifier of the source file.
    auto file_identifier = recovered_raw_data->metadata.file_identifier;
    temporary_file_paths.run_info = make_run_info_tmp_path(arrow_path, file_identifier);
    temporary_file_paths.reads = make_reads_tmp_path(arrow_path, file_identifier);

    // Recover the run info data into [dest_file]:
    auto run_info_writer = dest_file->impl()->run_info_table_writer();
    ARROW_RETURN_NOT_OK(append_recovered_file(
        temporary_file_paths.run_info, run_info_writer, "run information", pool));

    // Recover the read data into [dest_file]:
    auto read_writer = dest_file->impl()->read_table_writer();
    ARROW_RETURN_NOT_OK(
        append_recovered_file(temporary_file_paths.reads, read_writer, "reads", pool));

    return dest_file->close();
}

/// Count the signal rows, run infos and read rows of the recovered file by opening
/// it and reading every signal and read record batch, which also checks that each
/// batch can actually be read back.
static pod5::Result<RecoveredRowCounts> count_recovered_rows(
    std::filesystem::path const & recovered_path)
{
    ARROW_ASSIGN_OR_RAISE(
        std::shared_ptr<pod5::FileReader> reader, pod5::open_file_reader(recovered_path.string()));

    RecoveredRowCounts totals;

    // Signal table rows:
    std::size_t const signal_batch_count = reader->num_signal_record_batches();
    std::size_t signal_batch_index = 0;
    while (signal_batch_index < signal_batch_count) {
        ARROW_ASSIGN_OR_RAISE(
            auto const batch, reader->read_signal_record_batch(signal_batch_index));
        totals.signal += batch.num_rows();
        ++signal_batch_index;
    }

    // Run info entries:
    ARROW_ASSIGN_OR_RAISE(totals.run_info, reader->run_info_count());

    // Read table rows:
    std::size_t const read_batch_count = reader->num_read_record_batches();
    std::size_t read_batch_index = 0;
    while (read_batch_index < read_batch_count) {
        ARROW_ASSIGN_OR_RAISE(auto const batch, reader->read_read_record_batch(read_batch_index));
        totals.reads += batch.num_rows();
        ++read_batch_index;
    }

    return totals;
}

/// \brief File is considered useless for recovery if it is 0 bytes long
/// or if all bytes have value 0.
///
/// \param file_path Path of the file to inspect.
/// \returns true if the file is empty or contains only zero bytes. false if any
///          non-zero byte is found, or if the file cannot be opened or fully read
///          (in which case it is assumed to hold data, just in case).
/// \note file_size() throws std::filesystem::filesystem_error on failure.
static bool is_useless(std::filesystem::path const & file_path)
{
    if (file_size(file_path) == 0) {
        return true;
    }
    std::ifstream file{file_path, std::ios::in | std::ios::binary};
    if (!file.is_open()) {
        // If we can't open the file, assume there is data, just in case.
        return false;
    }

    // Use unformatted reads: formatted extraction (operator>>) skips whitespace
    // bytes, which would make a file full of e.g. spaces look like all zeros.
    char buffer[4096];
    while (file) {
        file.read(buffer, sizeof(buffer));
        std::streamsize const bytes_read = file.gcount();
        for (std::streamsize index = 0; index < bytes_read; ++index) {
            if (buffer[index] != 0) {
                return false;
            }
        }
    }

    // The loop stops at end of file or on a read error. Only a clean end of file
    // proves that every byte was zero; after an error assume there may be data.
    return file.eof() && !file.bad();
}

/// Delete [file_path] when it exists and is_useless() reports that it holds nothing
/// worth recovering. Filesystem errors propagate to the caller as exceptions.
static void remove_if_useless(std::filesystem::path const & file_path)
{
    if (!exists(file_path)) {
        return;
    }
    if (!is_useless(file_path)) {
        return;
    }
    remove(file_path);
}

/// Remove [file_path], converting a filesystem exception into a CleanupError.
/// \returns An empty optional when no filesystem_error was thrown, otherwise the
///          path together with the exception's description.
static std::optional<CleanupError> try_remove(std::string const & file_path)
{
    std::optional<CleanupError> failure;
    try {
        std::filesystem::remove(file_path);
    } catch (std::filesystem::filesystem_error const & error) {
        failure = CleanupError{.file_path = file_path, .description = error.what()};
    }
    return failure;
}

/// Build a status with the same code as [status] whose message is the original
/// message followed by the description of the filesystem error hit during cleanup.
///
/// A separator is placed between the two messages so that they do not run into
/// each other in the resulting text.
static Status add_clean_up_error(Status status, std::filesystem::filesystem_error const & exception)
{
    return arrow::Status::FromArgs(
        status.code(), status.message(), ". Clean up also failed: ", exception.what());
}

/// \brief Recover [src_path] into [dest_path], count the recovered rows and
/// optionally clean up afterwards.
///
/// \param src_path  Path of the file to recover.
/// \param dest_path Path of the file to write the recovered data to.
/// \param options   Recovery options: the writer options for the destination and
///                  whether files should be cleaned up.
/// \returns The recovered row counts (plus any cleanup errors) on success, or the
///          failure status of the recovery / row counting.
///
/// Cleanup behaviour when options.cleanup is set:
///  - on failure the destination file is removed, and the temporary files and the
///    source file are removed only if they are empty or all zero bytes;
///  - on success the source and temporary files are removed, and failures to do so
///    are collected in the returned details rather than failing the call.
pod5::Result<RecoveryDetails> recover_file(
    std::string const & src_path,
    std::string const & dest_path,
    RecoverFileOptions const & options)
{
    TemporaryFilePaths temp_file_paths;
    // Run the recovery and then re-open the result to count (and thereby verify) its rows.
    auto const result = [&]() -> pod5::Result<RecoveredRowCounts> {
        ARROW_RETURN_NOT_OK(
            recover_file(src_path, dest_path, options.file_writer_options, temp_file_paths));
        auto const row_count_result = count_recovered_rows(dest_path);
        if (!row_count_result.ok()) {
            return add_recovery_failure_context(row_count_result.status(), dest_path, "row counts");
        }
        return row_count_result;
    }();
    if (!options.cleanup) {
        // No cleanup requested: pass the outcome through, leaving all files in place.
        auto const to_recovery_details = [](RecoveredRowCounts counts) {
            return RecoveryDetails{counts};
        };
        return result.Map(to_recovery_details);
    }
    if (!result.ok()) {
        try {
            // A failed recovery must not leave a destination file behind.
            if (std::filesystem::exists(dest_path)) {
                std::filesystem::remove(dest_path);
            }
            // Inputs are only deleted when they contain nothing recoverable.
            remove_if_useless(temp_file_paths.reads);
            remove_if_useless(temp_file_paths.run_info);
            remove_if_useless(src_path);
        } catch (std::filesystem::filesystem_error const & error) {
            return add_clean_up_error(result.status(), error);
        }
        return result.status();
    }

    // Recovery succeeded: the inputs are no longer needed. Removal problems are
    // reported alongside the row counts instead of turning success into failure.
    RecoveryDetails details{.row_counts = *result};
    if (auto const error = try_remove(src_path)) {
        details.cleanup_errors.push_back(*error);
    }
    if (auto const error = try_remove(temp_file_paths.reads)) {
        details.cleanup_errors.push_back(*error);
    }
    if (auto const error = try_remove(temp_file_paths.run_info)) {
        details.cleanup_errors.push_back(*error);
    }
    return details;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/file_writer.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/read_table_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/signal_table_utils.h"

#include <cstdint>
#include <memory>

namespace arrow {
class Array;
class MemoryPool;
}  // namespace arrow

namespace pod5 {

class IOManager;
class ThreadPool;

/// \brief Settings bag consumed when creating a FileWriter.
///
/// The class is a plain collection of getters and setters over private members. The
/// `DEFAULT_*` constants below name the default for most settings; the constructor is
/// defined out of line.
class POD5_FORMAT_EXPORT FileWriterOptions {
public:
    /// \brief Default chunk size for signal table entries
    static constexpr std::uint32_t DEFAULT_SIGNAL_CHUNK_SIZE = 102'400;
    /// \brief Default batch size for the signal table.
    static constexpr std::uint32_t DEFAULT_SIGNAL_TABLE_BATCH_SIZE = 100;
    /// \brief Default batch size for the read table.
    static constexpr std::uint32_t DEFAULT_READ_TABLE_BATCH_SIZE = 1000;
    /// \brief Default batch size for the run info table.
    static constexpr std::uint32_t DEFAULT_RUN_INFO_TABLE_BATCH_SIZE = 1;
    /// \brief Default signal storage type.
    static constexpr SignalType DEFAULT_SIGNAL_TYPE = SignalType::VbzSignal;
    /// \brief Default for use_directio().
    static constexpr bool DEFAULT_USE_DIRECTIO = false;
    /// \brief Default for use_sync_io().
    static constexpr bool DEFAULT_USE_SYNC_IO = false;
    /// \brief Default for flush_on_batch_complete().
    static constexpr bool DEFAULT_FLUSH_ON_BATCH_COMPLETE = true;
    /// \brief Default for write_chunk_size(): 2 MiB.
    static constexpr std::size_t DEFAULT_WRITE_CHUNK_SIZE = 2 * 1024 * 1024;
    /// \brief Default for the keep_*_file_open() flags.
    ///
    /// This is a boolean flag (it was previously mis-typed as std::size_t holding `true`).
    static constexpr bool DEFAULT_KEEP_FILES_OPEN = true;

    FileWriterOptions();

    /// \brief Set the maximum size of a single signal chunk.
    void set_max_signal_chunk_size(std::uint32_t chunk_size)
    {
        m_max_signal_chunk_size = chunk_size;
    }

    std::uint32_t max_signal_chunk_size() const { return m_max_signal_chunk_size; }

    /// \brief Set the Arrow memory pool; the pointer is stored, not owned.
    void set_memory_pool(arrow::MemoryPool * memory_pool) { m_memory_pool = memory_pool; }

    arrow::MemoryPool * memory_pool() const { return m_memory_pool; }

    /// \brief Set how signal data is stored (see SignalType).
    void set_signal_type(SignalType signal_type) { m_signal_type = signal_type; }

    SignalType signal_type() const { return m_signal_type; }

    /// \brief Set the batch size used for the signal table.
    void set_signal_table_batch_size(std::size_t batch_size)
    {
        m_signal_table_batch_size = batch_size;
    }

    std::size_t signal_table_batch_size() const { return m_signal_table_batch_size; }

    /// \brief Set the batch size used for the read table.
    void set_read_table_batch_size(std::size_t batch_size) { m_read_table_batch_size = batch_size; }

    std::size_t read_table_batch_size() const { return m_read_table_batch_size; }

    /// \brief Set the batch size used for the run info table.
    void set_run_info_table_batch_size(std::size_t batch_size)
    {
        m_run_info_table_batch_size = batch_size;
    }

    std::size_t run_info_table_batch_size() const { return m_run_info_table_batch_size; }

    /// \brief Set the (shared) IO manager.
    void set_io_manager(std::shared_ptr<IOManager> const & io_manager)
    {
        m_io_manager = io_manager;
    }

    std::shared_ptr<IOManager> io_manager() const { return m_io_manager; }

    /// \brief Set the (shared) thread pool used by the writer.
    void set_thread_pool(std::shared_ptr<ThreadPool> const & writer_thread_pool)
    {
        m_writer_thread_pool = writer_thread_pool;
    }

    std::shared_ptr<ThreadPool> thread_pool() const { return m_writer_thread_pool; }

    /// \brief Enable or disable direct IO.
    void set_use_directio(bool use_directio) { m_use_directio = use_directio; }

    bool use_directio() const { return m_use_directio; }

    /// \brief Set the write chunk size, in bytes (see DEFAULT_WRITE_CHUNK_SIZE).
    void set_write_chunk_size(std::size_t chunk_size) { m_write_chunk_size = chunk_size; }

    std::size_t write_chunk_size() const { return m_write_chunk_size; }

    /// \brief Enable or disable synchronous IO.
    void set_use_sync_io(bool use_sync_io) { m_use_sync_io = use_sync_io; }

    bool use_sync_io() const { return m_use_sync_io; }

    /// \brief Choose whether output is flushed each time a batch completes.
    void set_flush_on_batch_complete(bool flush_on_batch_complete)
    {
        m_flush_on_batch_complete = flush_on_batch_complete;
    }

    bool flush_on_batch_complete() const { return m_flush_on_batch_complete; }

    bool keep_signal_file_open() const { return m_keep_signal_file_open; }

    /// \brief Choose whether the signal file handle is kept open between writes.
    void set_keep_signal_file_open(bool keep_signal_file_open)
    {
        m_keep_signal_file_open = keep_signal_file_open;
    }

    bool keep_run_info_file_open() const { return m_keep_run_info_file_open; }

    /// \brief Choose whether the run info file handle is kept open between writes.
    void set_keep_run_info_file_open(bool keep_run_info_file_open)
    {
        m_keep_run_info_file_open = keep_run_info_file_open;
    }

    bool keep_read_table_file_open() const { return m_keep_read_table_file_open; }

    /// \brief Choose whether the read table file handle is kept open between writes.
    void set_keep_read_table_file_open(bool keep_read_table_file_open)
    {
        m_keep_read_table_file_open = keep_read_table_file_open;
    }

private:
    std::shared_ptr<ThreadPool> m_writer_thread_pool;
    std::shared_ptr<IOManager> m_io_manager;
    std::uint32_t m_max_signal_chunk_size;
    arrow::MemoryPool * m_memory_pool;
    SignalType m_signal_type;
    std::size_t m_signal_table_batch_size;
    std::size_t m_read_table_batch_size;
    std::size_t m_run_info_table_batch_size;
    bool m_use_directio;
    std::size_t m_write_chunk_size;
    bool m_use_sync_io;
    bool m_flush_on_batch_complete;
    bool m_keep_signal_file_open;
    bool m_keep_run_info_file_open;
    bool m_keep_read_table_file_open;
};

class FileWriterImpl;

/// \brief Public handle for writing a pod5 file.
///
/// All work is forwarded to a privately owned FileWriterImpl (pimpl), so the
/// implementation details stay out of this header.
class POD5_FORMAT_EXPORT FileWriter {
public:
    /// \brief Take ownership of an implementation object.
    FileWriter(std::unique_ptr<FileWriterImpl> && impl);
    ~FileWriter();

    /// \brief Path associated with this writer.
    std::string path() const;

    /// \brief Close the writer, reporting any failure as a status.
    pod5::Status close();

    /// \brief Add a complete read together with its raw signal samples.
    pod5::Status add_complete_read(
        ReadData const & read_data,
        gsl::span<std::int16_t const> const & signal);

    /// \brief Add a complete read with rows already pre appended.
    /// \param read_data        Description of the read.
    /// \param signal_rows      Signal table row indices that belong to the read.
    /// \param signal_duration  Signal duration of the read (presumably in samples - confirm).
    pod5::Status add_complete_read(
        ReadData const & read_data,
        gsl::span<std::uint64_t const> const & signal_rows,
        std::uint64_t signal_duration);

    /// \brief Add signal for a read, returning the signal table rows it was written to.
    pod5::Result<std::vector<SignalTableRowIndex>> add_signal(
        Uuid const & read_id,
        gsl::span<std::int16_t const> const & signal);

    /// \brief Add signal which the caller has already compressed, returning its row index.
    /// \param sample_count Number of samples represented by \p signal_bytes.
    pod5::Result<SignalTableRowIndex> add_pre_compressed_signal(
        Uuid const & read_id,
        gsl::span<std::uint8_t const> const & signal_bytes,
        std::uint32_t sample_count);

    /// \brief Add a pre-built batch of signal table columns.
    /// \returns A pair of signal table row indices (presumably the first and last row of the
    ///          batch - confirm against the implementation).
    pod5::Result<std::pair<SignalTableRowIndex, SignalTableRowIndex>> add_signal_batch(
        std::size_t row_count,
        std::vector<std::shared_ptr<arrow::Array>> && columns,
        bool final_batch);

    // Find or create an end reason index representing this read end reason.
    pod5::Result<EndReasonDictionaryIndex> lookup_end_reason(ReadEndReason end_reason) const;
    /// \brief Add a pore type, returning its dictionary index.
    pod5::Result<PoreDictionaryIndex> add_pore_type(std::string const & pore_type_data);
    /// \brief Add a run info entry, returning its dictionary index.
    pod5::Result<RunInfoDictionaryIndex> add_run_info(RunInfoData const & run_info_data);

    SignalType signal_type() const;
    std::size_t signal_table_batch_size() const;

    /// \brief Non-owning access to the implementation object.
    FileWriterImpl * impl() const { return m_impl.get(); }

private:
    std::unique_ptr<FileWriterImpl> m_impl;
};

/// \brief Create a FileWriter for the file at \p path.
/// \param path                   Path of the file to write.
/// \param writing_software_name  Name of the software doing the writing (presumably recorded
///                               in the file footer - confirm against the implementation).
/// \param options                Writer settings; a default-constructed FileWriterOptions is
///                               used when omitted.
/// \returns The new writer on success, otherwise an error status.
POD5_FORMAT_EXPORT pod5::Result<std::unique_ptr<FileWriter>> create_file_writer(
    std::string const & path,
    std::string const & writing_software_name,
    FileWriterOptions const & options = {});

/// \brief Options controlling recover_file.
struct POD5_FORMAT_EXPORT RecoverFileOptions {
    /// Writer settings forwarded to the recovery process.
    FileWriterOptions file_writer_options = {};

    /// If this is set to true, recover_file will remove the following files
    ///   * Temp files which we have successfully recovered data from.
    ///   * Temp files which we have failed to recover data from and which hold no data.
    ///   * Output file created during failed recovery.
    /// Defaults to false, in which case no files are removed.
    bool cleanup = false;
};

/// \brief Number of rows recovered per table; every count starts at zero.
struct POD5_FORMAT_EXPORT RecoveredRowCounts final {
    /// Rows recovered for the signal table.
    std::size_t signal = 0;
    /// Rows recovered for the run info table.
    std::size_t run_info = 0;
    /// Rows recovered for the reads table.
    std::size_t reads = 0;
};

/// \brief Describes one file that could not be cleaned up after a recovery.
struct POD5_FORMAT_EXPORT CleanupError final {
    /// Path of the file the cleanup failure relates to.
    std::string file_path;
    /// Human readable description of what went wrong.
    std::string description;
};

/// \brief Outcome of a successful recover_file call.
struct POD5_FORMAT_EXPORT RecoveryDetails final {
    /// Per-table counts of the rows that were recovered.
    RecoveredRowCounts row_counts;
    /// Non-fatal failures hit while removing files after recovery; empty when nothing failed.
    std::vector<CleanupError> cleanup_errors;
};

/// \brief Recover data from \p src_path into a new file at \p dest_path.
/// \param src_path   Path of the file to recover data from.
/// \param dest_path  Path of the file to write the recovered data to.
/// \param options    Recovery settings; see RecoverFileOptions for what `cleanup` removes.
/// \returns Details of the recovery (row counts plus any cleanup errors) on success,
///          otherwise an error status.
POD5_FORMAT_EXPORT pod5::Result<RecoveryDetails> recover_file(
    std::string const & src_path,
    std::string const & dest_path,
    RecoverFileOptions const & options = {});

}  // namespace pod5


================================================
FILE: c++/pod5_format/flatbuffers/footer.fbs
================================================
namespace Minknow.ReadsFormat;

// Identifies what an EmbeddedFile contains.
// Values are numbered implicitly by declaration order, so new entries must only ever be
// appended to keep previously written files readable.
enum ContentType:short {
    // The Reads table (an Arrow table)
    ReadsTable,
    // The Signal table (an Arrow table)
    SignalTable,
    // An index for looking up data in the ReadsTable by read_id
    ReadIdIndex,
    // An index based on other columns and/or tables (it will need to be opened to find out what it indexes)
    OtherIndex,
    // The Run Info table (an Arrow table)
    RunInfoTable,
}

// The on-disk format of an EmbeddedFile. Only one format is currently defined.
enum Format:short {
    // The Apache Feather V2 format, also known as the Apache Arrow IPC File format.
    FeatherV2,
}

// Describes an embedded file: where it sits, how long it is, and what it holds.
table EmbeddedFile {
    // The start of the embedded file
    offset: int64;
    // The length of the embedded file (excluding any padding)
    length: int64;
    // The format of the file
    format: Format;
    // What contents should be expected in the file
    content_type: ContentType;
}

// The footer: identifies the file and its writer, and lists every embedded file.
table Footer {
    // Must match the "MINKNOW:file_identifier" custom metadata entry in the schemas of the bundled tables.
    file_identifier: string;
    // A free-form description of the software that wrote the file, intended to help pin down the source of files that violate the specification.
    software: string;
    // The version of this specification that the table schemas are based on (1.0.0).
    pod5_version: string;
    // The Apache Arrow tables stored in the file.
    contents: [ EmbeddedFile ];
}


================================================
FILE: c++/pod5_format/internal/async_output_stream.h
================================================
#pragma once

#include "pod5_format/file_output_stream.h"
#include "pod5_format/internal/tracing/tracing.h"
#include "pod5_format/thread_pool.h"

#include <arrow/buffer.h>
#include <arrow/util/future.h>
#include <gsl/gsl-lite.hpp>

#include <cassert>
#include <condition_variable>
#include <deque>
#include <thread>

namespace pod5 {

/// \brief Output stream which copies every write into a buffer and performs the actual
///        `fwrite` on a thread pool strand.
///
/// Callers submit data with Write(); Flush() and Close() block until all submitted writes have
/// completed (or an error has been recorded). The first error hit by a background write is
/// stored and returned from subsequent Write()/Flush() calls.
///
/// When `keep_file_open` is false the file handle is closed whenever no writes are pending
/// and re-opened in append mode on demand.
class AsyncOutputStream : public FileOutputStream {
    // Tag type which keeps the public constructor unusable outside of make().
    struct PrivateDummy {};

public:
    /// \brief Create a stream writing to \p file_path.
    ///
    /// The file is created/truncated immediately. A failure to open it is recorded on the
    /// stream and reported by the first Write() or Flush().
    static arrow::Result<std::shared_ptr<AsyncOutputStream>> make(
        std::string const & file_path,
        std::shared_ptr<ThreadPool> const & thread_pool,
        bool flush_on_batch_complete,
        arrow::MemoryPool * memory_pool = arrow::default_memory_pool(),
        bool keep_file_open = true)
    {
        return std::make_shared<AsyncOutputStream>(
            file_path,
            thread_pool,
            flush_on_batch_complete,
            memory_pool,
            keep_file_open,
            PrivateDummy{});
    }

    ~AsyncOutputStream() { (void)Close(); }

    /// \brief Wait for pending writes, then close the file handle.
    ///
    /// The handle is released even when flushing fails, so a failed stream does not leak its
    /// `FILE *`; the flush status is what gets returned.
    arrow::Status Close() override
    {
        // flush all output
        auto const flush_status = Flush();

        // and close stream
        release_file_handle();
        return flush_status;
    }

    arrow::Future<> CloseAsync() override
    {
        ARROW_RETURN_NOT_OK(Close());
        return FileOutputStream::CloseAsync();
    }

    /// \brief Close the file handle without waiting for pending writes.
    arrow::Status Abort() override
    {
        release_file_handle();
        return arrow::Status::OK();
    }

    /// \brief Bytes submitted so far, relative to the configured file start offset.
    arrow::Result<int64_t> Tell() const override
    {
        return m_actual_bytes_written - m_file_start_offset;
    }

    // NOTE(review): reads m_file_handle without taking m_file_handle_mutex, and reports true
    // whenever the handle is temporarily closed because keep_file_open is false.
    bool closed() const override { return m_file_handle == nullptr; }

    /// \brief Copy \p nbytes from \p data into a new buffer and queue it for writing.
    arrow::Status Write(void const * data, int64_t nbytes) override
    {
        POD5_TRACE_FUNCTION();
        ARROW_ASSIGN_OR_RAISE(
            std::shared_ptr<arrow::Buffer> buffer, arrow::AllocateBuffer(nbytes, m_memory_pool));
        auto const char_data = static_cast<std::uint8_t const *>(data);
        std::copy(char_data, char_data + nbytes, buffer->mutable_data());
        return Write(buffer);
    }

    /// \brief Queue \p data to be written by the strand.
    ///
    /// Blocks while more than 10MB of writes are pending. Returns the stored error if a
    /// previous write failed.
    arrow::Status Write(std::shared_ptr<arrow::Buffer> const & data) override
    {
        POD5_TRACE_FUNCTION();
        if (m_has_error) {
            return error();
        }

        std::size_t const BUFFER_SIZE = 10 * 1024 * 1024;  // 10mb pending writes max
        while ((m_submitted_byte_writes - m_completed_byte_writes) > BUFFER_SIZE) {
            // Once a write has failed the remaining queued writes bail out without advancing
            // m_completed_byte_writes, so stop waiting or we would spin here forever.
            if (m_has_error) {
                return error();
            }
            std::this_thread::sleep_for(std::chrono::milliseconds(5));
        }

        m_submitted_byte_writes += data->size();
        m_actual_bytes_written += data->size();

        m_submitted_writes += 1;
        m_strand->post([&, data] {
            POD5_TRACE_FUNCTION();
            if (m_has_error) {
                return;
            }

            std::lock_guard<std::mutex> l{m_file_handle_mutex};
            auto file_handle = get_or_open_file_handle(l);
            if (!file_handle) {
                set_error(arrow::Status::IOError("Failed to open file handle for writing"));
                return;
            }
            if (fwrite(data->data(), 1, (std::size_t)data->size(), file_handle)
                != (std::size_t)data->size())
            {
                set_error(arrow::Status::IOError("Failed to write data to file"));
                return;
            }
            m_completed_byte_writes += data->size();

            // Ensure we do this after editing all the other members, in order to prevent `Flush`
            // returning until we are done.
            m_completed_writes += 1;

            // Close the file handle if we do not have further writes pending:
            if (m_submitted_writes == m_completed_writes) {
                close_file_handle(l);
            }
        });

        return arrow::Status::OK();
    }

    /// \brief Block until every write submitted so far has completed, then `fflush` the file.
    arrow::Status Flush() override
    {
        POD5_TRACE_FUNCTION();
        // Wait for our completed writes to match our submitted writes,
        // this guarantees our async operations are finished.
        auto wait_for_write_count = m_submitted_writes.load();
        while (m_completed_writes.load() < wait_for_write_count && !m_has_error) {
            std::this_thread::sleep_for(std::chrono::microseconds(10));
        }

        if (m_has_error) {
            return error();
        }

        // No file handle so nothing to flush
        std::lock_guard<std::mutex> l{m_file_handle_mutex};
        if (!m_file_handle) {
            return arrow::Status::OK();
        }

        if (fflush(m_file_handle) != 0) {
            return arrow::Status::IOError("Error flushing file");
        }
        return arrow::Status::OK();
    }

    void set_file_start_offset(std::size_t val) override { m_file_start_offset = val; }

    /// \brief Flush if the stream was configured to flush on batch completion.
    arrow::Status batch_complete() override
    {
        if (m_flush_on_batch_complete) {
            return Flush();
        }
        return arrow::Status::OK();
    }

    /// \brief Use make() instead; PrivateDummy makes this uncallable from outside the class.
    AsyncOutputStream(
        std::string const & file_path,
        std::shared_ptr<ThreadPool> const & thread_pool,
        bool flush_on_batch_complete,
        arrow::MemoryPool * memory_pool,
        bool keep_file_open,
        PrivateDummy)
    : m_has_error{false}
    , m_submitted_writes{0}
    , m_completed_writes{0}
    , m_submitted_byte_writes{0}
    , m_completed_byte_writes{0}
    , m_actual_bytes_written{0}
    , m_flush_on_batch_complete(flush_on_batch_complete)
    , m_file_path(file_path)
    , m_keep_file_open(keep_file_open)
    , m_file_start_offset{0}
    , m_strand{thread_pool->create_strand()}
    , m_memory_pool(memory_pool)
    {
        // Create (or truncate) the file up front; later re-opens use append mode.
        m_file_handle = fopen(m_file_path.c_str(), "wb");
        if (!m_file_handle) {
            set_error(arrow::Status::IOError("Failed to open file for writing: ", errno));
            // Nothing to close - calling fclose on a null handle is undefined behaviour.
            return;
        }
        if (!m_keep_file_open) {
            fclose(m_file_handle);
            m_file_handle = nullptr;
        }
    }

private:
    arrow::MemoryPool * memory_pool() { return m_memory_pool; }

    /// Return the open handle, re-opening the file in append mode when it is closed.
    /// The caller must hold m_file_handle_mutex (witnessed by \p lock).
    FILE * get_or_open_file_handle([[maybe_unused]] std::lock_guard<std::mutex> & lock)
    {
        if (m_file_handle) {
            return m_file_handle;
        }

        m_file_handle = fopen(m_file_path.c_str(), "ab");
        return m_file_handle;
    }

    /// Close the handle between writes, but only when the stream is not keeping it open.
    /// The caller must hold m_file_handle_mutex (witnessed by \p lock).
    void close_file_handle([[maybe_unused]] std::lock_guard<std::mutex> & lock)
    {
        if (m_file_handle && !m_keep_file_open) {
            fclose(m_file_handle);
            m_file_handle = nullptr;
        }
    }

    /// Unconditionally close the handle (if any), taking m_file_handle_mutex itself.
    void release_file_handle()
    {
        std::lock_guard<std::mutex> l{m_file_handle_mutex};
        if (m_file_handle) {
            fclose(m_file_handle);
            m_file_handle = nullptr;
        }
    }

    /// Record \p status as the stream error; m_has_error is raised only after it is stored.
    void set_error(arrow::Status status)
    {
        assert(!status.ok());
        {
            std::lock_guard<std::mutex> l{m_error_mutex};
            m_error = std::move(status);
        }
        m_has_error = true;
    }

    arrow::Status error() const
    {
        std::lock_guard<std::mutex> l{m_error_mutex};
        return m_error;
    }

    std::atomic<bool> m_has_error;

    std::atomic<std::size_t> m_submitted_writes;
    std::atomic<std::size_t> m_completed_writes;
    std::atomic<std::size_t> m_submitted_byte_writes;
    std::atomic<std::size_t> m_completed_byte_writes;
    // this represents the number of data bytes written (excluding any padding for alignment)
    // used for truncating the file for instance
    std::int64_t m_actual_bytes_written;

    bool m_flush_on_batch_complete;

    std::string m_file_path;
    std::mutex m_file_handle_mutex;
    FILE * m_file_handle{nullptr};
    bool m_keep_file_open{false};

    mutable std::mutex m_error_mutex;
    arrow::Status m_error;

    std::size_t m_file_start_offset;
    std::shared_ptr<ThreadPoolStrand> m_strand;
    arrow::MemoryPool * m_memory_pool;
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/internal/combined_file_utils.h
================================================
#pragma once

#include "pod5_flatbuffers/footer_generated.h"
#include "pod5_format/file_reader.h"
#include "pod5_format/result.h"
#include "pod5_format/uuid.h"
#include "pod5_format/version.h"

#include <arrow/buffer.h>
#include <arrow/io/file.h>
#include <arrow/util/endian.h>
#include <arrow/util/io_util.h>
#include <flatbuffers/flatbuffers.h>

#include <array>

namespace pod5 { namespace combined_file_utils {

/// Eight byte signature emitted by write_file_signature and compared against by
/// check_signature.
static constexpr std::array<char, 8>
    FILE_SIGNATURE{'\213', 'P', 'O', 'D', '\r', '\n', '\032', '\n'};

/// Size in bytes of the combined header (file signature followed by a section marker).
static constexpr std::size_t header_size = 24;  // signature 8 bytes, section marker 16 bytes

/// \brief Write zero bytes to \p sink until its position is a multiple of \p pad_to_size.
///
/// Nothing is written when the position is already aligned. Padding is emitted in chunks so
/// that alignments larger than the local zero buffer are handled without reading past it.
///
/// \param sink         Stream to pad.
/// \param pad_to_size  Alignment in bytes; must be non-zero.
/// \returns OK on success, Invalid when \p pad_to_size is zero, or the stream's error.
inline pod5::Status pad_file(
    std::shared_ptr<arrow::io::OutputStream> const & sink,
    std::uint32_t pad_to_size)
{
    if (pad_to_size == 0) {
        // Guard the modulo below against a division by zero.
        return pod5::Status::Invalid("Cannot pad a file to a zero byte boundary");
    }

    ARROW_ASSIGN_OR_RAISE(auto const current_byte_location, sink->Tell());
    std::int64_t const bytes_past_boundary = current_byte_location % pad_to_size;
    if (bytes_past_boundary == 0) {
        return pod5::Status::OK();
    }

    std::array<char, 128> const zeroes{};
    std::int64_t bytes_to_write = pad_to_size - bytes_past_boundary;
    while (bytes_to_write > 0) {
        // Never hand out more bytes than the zero buffer actually holds.
        auto const chunk_size = std::min<std::int64_t>(bytes_to_write, zeroes.size());
        ARROW_RETURN_NOT_OK(sink->Write(zeroes.data(), chunk_size));
        bytes_to_write -= chunk_size;
    }
    return pod5::Status::OK();
}

/// \brief Write the bytes of FILE_SIGNATURE to \p sink.
inline pod5::Status write_file_signature(std::shared_ptr<arrow::io::OutputStream> const & sink)
{
    auto const * const signature_bytes = FILE_SIGNATURE.data();
    auto const signature_length = FILE_SIGNATURE.size();
    return sink->Write(signature_bytes, signature_length);
}

/// \brief Write the raw bytes of \p section_marker to \p sink.
inline pod5::Status write_section_marker(
    std::shared_ptr<arrow::io::OutputStream> const & sink,
    Uuid const & section_marker)
{
    auto const marker_bytes = section_marker.data();
    auto const marker_length = section_marker.size();
    return sink->Write(marker_bytes, marker_length);
}

/// \brief Write the file header: the file signature followed by \p section_marker.
///
/// Stops at the first failure; the section marker is not written if the signature fails.
inline pod5::Status write_combined_header(
    std::shared_ptr<arrow::io::OutputStream> const & sink,
    Uuid const & section_marker)
{
    ARROW_RETURN_NOT_OK(write_file_signature(sink));
    pod5::Status marker_status = write_section_marker(sink, section_marker);
    return marker_status;
}

/// \brief Write the eight byte footer magic ("FOOTER" plus two zero bytes) to \p sink.
inline pod5::Status write_footer_magic(std::shared_ptr<arrow::io::OutputStream> const & sink)
{
    // The literal carries its own trailing terminator; only the first eight bytes are written.
    static constexpr char FOOTER_MAGIC[] = "FOOTER\0\0";
    return sink->Write(FOOTER_MAGIC, 8);
}

/// \brief Location of an embedded table within a combined file.
struct FileInfo {
    /// Byte offset at which the embedded file starts.
    std::int64_t file_start_offset = 0;
    /// Length of the embedded file in bytes.
    std::int64_t file_length = 0;
};

/// \brief A FileInfo together with the path and open handle of the file that contains it.
struct ParsedFileInfo : FileInfo {
    std::string file_path;
    std::shared_ptr<arrow::io::RandomAccessFile> file;

    /// \brief Point this info at the whole of \p in_file_path.
    ///
    /// Memory maps the file read-only and records offset zero and the full file size.
    /// Members assigned before a failing step keep their new values.
    arrow::Status from_full_file(std::string in_file_path)
    {
        file_path = in_file_path;

        ARROW_ASSIGN_OR_RAISE(
            auto mapped_file,
            arrow::io::MemoryMappedFile::Open(in_file_path, arrow::io::FileMode::READ));
        file = std::move(mapped_file);

        // The section starts at the very beginning of the file and spans all of it.
        file_start_offset = 0;
        ARROW_ASSIGN_OR_RAISE(auto const mapped_size, file->GetSize());
        file_length = mapped_size;
        return arrow::Status::OK();
    }
};

/// \brief Serialise the footer flatbuffer describing the three embedded tables and write it.
///
/// The embedded file entries are created in signal, run info, reads order.
///
/// \returns The size in bytes of the flatbuffer written to \p sink.
inline pod5::Result<std::int64_t> write_footer_flatbuffer(
    std::shared_ptr<arrow::io::OutputStream> const & sink,
    Uuid const & file_identifier,
    std::string const & software_name,
    FileInfo const & signal_table,
    FileInfo const & run_info_table,
    FileInfo const & reads_table)
{
    flatbuffers::FlatBufferBuilder builder(1024);

    // Every embedded table is a Feather V2 file; only location and content type differ.
    auto const describe_table =
        [&builder](FileInfo const & table, Minknow::ReadsFormat::ContentType content_type) {
            return Minknow::ReadsFormat::CreateEmbeddedFile(
                builder,
                table.file_start_offset,
                table.file_length,
                Minknow::ReadsFormat::Format_FeatherV2,
                content_type);
        };

    // Braced initialisers are evaluated left to right, which fixes the creation order.
    std::vector<flatbuffers::Offset<Minknow::ReadsFormat::EmbeddedFile>> const files{
        describe_table(signal_table, Minknow::ReadsFormat::ContentType_SignalTable),
        describe_table(run_info_table, Minknow::ReadsFormat::ContentType_RunInfoTable),
        describe_table(reads_table, Minknow::ReadsFormat::ContentType_ReadsTable)};

    auto const identifier_text = to_string(file_identifier);
    auto const footer = Minknow::ReadsFormat::CreateFooterDirect(
        builder, identifier_text.c_str(), software_name.c_str(), Pod5Version.c_str(), &files);
    builder.Finish(footer);

    auto const footer_size = builder.GetSize();
    ARROW_RETURN_NOT_OK(sink->Write(builder.GetBufferPointer(), footer_size));
    return footer_size;
}

/// \brief Write the complete file footer to \p sink.
///
/// Layout, in order: footer magic, footer flatbuffer, zero padding to an 8 byte boundary,
/// the flatbuffer length as a little endian 64 bit integer, the section marker and finally
/// the file signature.
inline pod5::Status write_footer(
    std::shared_ptr<arrow::io::OutputStream> const & sink,
    Uuid const & section_marker,
    Uuid const & file_identifier,
    std::string const & software_name,
    FileInfo const & signal_table,
    FileInfo const & run_info_table,
    FileInfo const & reads_table)
{
    ARROW_RETURN_NOT_OK(write_footer_magic(sink));

    ARROW_ASSIGN_OR_RAISE(
        std::int64_t const flatbuffer_length,
        write_footer_flatbuffer(
            sink, file_identifier, software_name, signal_table, run_info_table, reads_table));
    ARROW_RETURN_NOT_OK(pad_file(sink, 8));

    // The length is stored little endian regardless of the host byte order.
    std::int64_t const encoded_length = arrow::bit_util::ToLittleEndian(flatbuffer_length);
    ARROW_RETURN_NOT_OK(sink->Write(&encoded_length, sizeof(encoded_length)));

    ARROW_RETURN_NOT_OK(write_section_marker(sink, section_marker));
    return write_file_signature(sink);
}

/// \brief Contents of a file footer, as filled in by read_footer.
struct ParsedFooter {
    /// Identifier parsed from the footer's file_identifier string.
    Uuid file_identifier;
    /// The footer's software string.
    std::string software_name;
    /// The footer's pod5_version string.
    std::string writer_pod5_version;

    /// Location of the run info table within the file.
    ParsedFileInfo run_info_table;
    /// Location of the reads table within the file.
    ParsedFileInfo reads_table;
    /// Location of the signal table within the file.
    ParsedFileInfo signal_table;
};

/// \brief Make all three table entries of \p footer refer to \p file.
inline void bind_footer_file(
    ParsedFooter & footer,
    std::shared_ptr<arrow::io::RandomAccessFile> const & file)
{
    for (ParsedFileInfo * table :
         {&footer.reads_table, &footer.run_info_table, &footer.signal_table})
    {
        table->file = file;
    }
}

/// \brief Check that the bytes at \p offset_in_file in \p file equal FILE_SIGNATURE.
/// \returns OK on a match; IOError on a short read or mismatch; otherwise the read error.
inline pod5::Status check_signature(
    std::shared_ptr<arrow::io::RandomAccessFile> const & file,
    std::int64_t offset_in_file)
{
    std::array<char, sizeof(FILE_SIGNATURE)> candidate;
    ARROW_ASSIGN_OR_RAISE(
        auto const bytes_read, file->ReadAt(offset_in_file, candidate.size(), candidate.data()));

    // Only compare the bytes once we know the whole signature was read.
    bool const read_complete = bytes_read == static_cast<std::int16_t>(candidate.size());
    if (read_complete && candidate == FILE_SIGNATURE) {
        return arrow::Status::OK();
    }
    return arrow::Status::IOError("Invalid signature in file");
}

/// \brief Verify \p footer_data as a Footer flatbuffer and return its root.
///
/// The returned pointer refers into \p footer_data, which must outlive it.
inline pod5::Result<Minknow::ReadsFormat::Footer const *> read_footer_flatbuffer(
    std::vector<std::uint8_t> const & footer_data)
{
    flatbuffers::Verifier verifier(footer_data.data(), footer_data.size());
    bool const is_valid_footer = verifier.VerifyBuffer<Minknow::ReadsFormat::Footer>();
    if (is_valid_footer) {
        return flatbuffers::GetRoot<Minknow::ReadsFormat::Footer>(footer_data.data());
    }
    return arrow::Status::IOError("Invalid footer found in file");
}

/// \brief Locate, validate and parse the footer of a combined file.
///
/// Expected layout at the end of the file, in order: footer flatbuffer, footer length
/// (little endian 64 bit integer), section marker, file signature.
///
/// \param file_path  Path recorded on each table entry of the result.
/// \param file       Open handle to the file; also recorded on each table entry.
/// \returns The parsed footer, or an IOError (or the underlying read error) when the file is
///          too small, a signature is missing, or the footer contents are invalid.
inline pod5::Result<ParsedFooter> read_footer(
    std::string const & file_path,
    std::shared_ptr<arrow::io::RandomAccessFile> const & file)
{
    // Verify signature at start and end of file:
    ARROW_RETURN_NOT_OK(check_signature(file, 0));
    ARROW_ASSIGN_OR_RAISE(auto const file_size, file->GetSize());
    ARROW_RETURN_NOT_OK(check_signature(file, file_size - FILE_SIGNATURE.size()));

    std::int64_t footer_length = 0;

    // The file must at least hold the footer length, section marker and trailing signature,
    // otherwise the offsets computed below would be negative.
    auto const trailer_size = static_cast<std::int64_t>(
        FILE_SIGNATURE.size() + sizeof(Uuid) + sizeof(footer_length));
    if (file_size < trailer_size) {
        return arrow::Status::IOError("File too small to contain a footer");
    }
    std::int64_t const footer_length_offset = file_size - trailer_size;

    ARROW_ASSIGN_OR_RAISE(
        auto const length_bytes_read,
        file->ReadAt(footer_length_offset, sizeof(footer_length), &footer_length));
    if (length_bytes_read != static_cast<std::int64_t>(sizeof(footer_length))) {
        return arrow::Status::IOError("Failed to read footer length");
    }
    footer_length = arrow::bit_util::FromLittleEndian(footer_length);
    // The footer sits directly before its length, so it cannot be longer than what precedes it.
    if (footer_length < 0 || footer_length > footer_length_offset) {
        return arrow::Status::IOError("Invalid footer length");
    }

    std::vector<std::uint8_t> footer_data;
    footer_data.resize(footer_length);
    ARROW_ASSIGN_OR_RAISE(
        auto read_bytes,
        file->ReadAt(footer_length_offset - footer_length, footer_length, footer_data.data()));
    if (read_bytes != footer_length) {
        return arrow::Status::IOError("Failed to read footer data");
    }
    ARROW_ASSIGN_OR_RAISE(auto fb_footer, read_footer_flatbuffer(footer_data));

    ParsedFooter footer;
    if (!fb_footer->file_identifier()) {
        return arrow::Status::IOError("Invalid footer file_identifier");
    }
    auto const identifier = Uuid::from_string(fb_footer->file_identifier()->str());
    if (!identifier) {
        return Status::IOError(
            "Invalid file_identifier in file: '", fb_footer->file_identifier()->str(), "'");
    }
    footer.file_identifier = *identifier;

    if (!fb_footer->software()) {
        return arrow::Status::IOError("Invalid footer software");
    }
    footer.software_name = fb_footer->software()->str();

    if (!fb_footer->pod5_version()) {
        return arrow::Status::IOError("Invalid footer pod5_version");
    }
    footer.writer_pod5_version = fb_footer->pod5_version()->str();

    if (!fb_footer->contents()) {
        return arrow::Status::IOError("Invalid footer contents");
    }
    // Copy the location of each known table; any other content type is rejected.
    for (auto const embedded_file : *fb_footer->contents()) {
        if (embedded_file->format() != Minknow::ReadsFormat::Format_FeatherV2) {
            return arrow::Status::IOError("Invalid embedded file format");
        }
        switch (embedded_file->content_type()) {
        case Minknow::ReadsFormat::ContentType_RunInfoTable:
            footer.run_info_table.file_start_offset = embedded_file->offset();
            footer.run_info_table.file_length = embedded_file->length();
            footer.run_info_table.file = file;
            footer.run_info_table.file_path = file_path;
            break;
        case Minknow::ReadsFormat::ContentType_ReadsTable:
            footer.reads_table.file_start_offset = embedded_file->offset();
            footer.reads_table.file_length = embedded_file->length();
            footer.reads_table.file = file;
            footer.reads_table.file_path = file_path;
            break;
        case Minknow::ReadsFormat::ContentType_SignalTable:
            footer.signal_table.file_start_offset = embedded_file->offset();
            footer.signal_table.file_length = embedded_file->length();
            footer.signal_table.file = file;
            footer.signal_table.file_path = file_path;
            break;

        default:
            return arrow::Status::IOError("Unknown embedded file type");
        }
    }

    return footer;
}

/// \brief Read-only view onto a byte range of another RandomAccessFile.
///
/// Positions passed to and returned from this class are relative to the start of the range;
/// they are translated by the range offset before being forwarded to the wrapped file. Reads
/// are shortened so that they do not run past the end of the range.
class SubFile : public arrow::io::internal::RandomAccessFileConcurrencyWrapper<SubFile> {
public:
    /// \param main_file        File that contains the range.
    /// \param sub_file_offset  Offset of the range within \p main_file.
    /// \param sub_file_length  Length of the range in bytes.
    SubFile(
        std::shared_ptr<arrow::io::RandomAccessFile> main_file,
        std::int64_t sub_file_offset,
        std::int64_t sub_file_length)
    : m_file(std::move(main_file))
    , m_sub_file_offset(sub_file_offset)
    , m_sub_file_length(sub_file_length)
    {
    }

protected:
    // Closing the view closes the wrapped file.
    arrow::Status DoClose() { return m_file->Close(); }

    bool closed() const override { return m_file->closed(); }

    // Position of the wrapped file, expressed relative to the start of the range.
    arrow::Result<std::int64_t> DoTell() const
    {
        ARROW_ASSIGN_OR_RAISE(auto const parent_position, m_file->Tell());
        return parent_position - m_sub_file_offset;
    }

    // Seek to a range-relative offset; the end of the range is an allowed target.
    arrow::Status DoSeek(int64_t offset)
    {
        bool const inside_range = offset >= 0 && offset <= m_sub_file_length;
        if (!inside_range) {
            return arrow::Status::IOError("Invalid offset into SubFile");
        }
        return m_file->Seek(m_sub_file_offset + offset);
    }

    // Read from the current position into caller-provided storage.
    arrow::Result<std::int64_t> DoRead(int64_t length, void * data)
    {
        ARROW_ASSIGN_OR_RAISE(auto const parent_position, m_file->Tell());
        int64_t const bytes_left = m_sub_file_offset + m_sub_file_length - parent_position;
        return m_file->Read(std::min(bytes_left, length), data);
    }

    // Read from the current position into a newly allocated buffer.
    arrow::Result<std::shared_ptr<arrow::Buffer>> DoRead(int64_t length)
    {
        ARROW_ASSIGN_OR_RAISE(auto const parent_position, m_file->Tell());
        int64_t const bytes_left = m_sub_file_offset + m_sub_file_length - parent_position;
        return m_file->Read(std::min(bytes_left, length));
    }

    // Read at a range-relative position into caller-provided storage.
    Result<int64_t> DoReadAt(int64_t position, int64_t nbytes, void * out)
    {
        bool const inside_range = position >= 0 && position <= m_sub_file_length;
        if (!inside_range) {
            return arrow::Status::IOError("Invalid offset into SubFile");
        }
        int64_t const bytes_left = m_sub_file_length - position;
        return m_file->ReadAt(m_sub_file_offset + position, std::min(nbytes, bytes_left), out);
    }

    // Read at a range-relative position into a newly allocated buffer.
    Result<std::shared_ptr<arrow::Buffer>> DoReadAt(int64_t position, int64_t nbytes)
    {
        bool const inside_range = position >= 0 && position <= m_sub_file_length;
        if (!inside_range) {
            return arrow::Status::IOError("Invalid offset into SubFile");
        }
        int64_t const bytes_left = m_sub_file_length - position;
        return m_file->ReadAt(m_sub_file_offset + position, std::min(nbytes, bytes_left));
    }

    // The size of the view is the length of the range, not of the wrapped file.
    arrow::Result<std::int64_t> DoGetSize() { return m_sub_file_length; }

private:
    friend RandomAccessFileConcurrencyWrapper<SubFile>;

    std::shared_ptr<arrow::io::RandomAccessFile> m_file;
    std::int64_t m_sub_file_offset;
    std::int64_t m_sub_file_length;
};

/// \brief Open the section described by \p file_info as a SubFile positioned at its start.
///
/// The offset and length come from a file footer, so they are validated against the size of
/// the containing file before use.
///
/// \returns The opened sub file, or Invalid when no file is attached or the described range
///          does not lie within the file.
inline arrow::Result<std::shared_ptr<SubFile>> open_sub_file(ParsedFileInfo file_info)
{
    if (!file_info.file) {
        return arrow::Status::Invalid("Failed to open file from footer");
    }
    ARROW_ASSIGN_OR_RAISE(auto file_size, file_info.file->GetSize());
    // Reject negative values as well as ranges that extend past the end of the file. The
    // last comparison is written as a subtraction so that it cannot overflow.
    if (file_info.file_start_offset < 0 || file_info.file_length < 0
        || file_info.file_length > file_size
        || file_info.file_start_offset > file_size - file_info.file_length)
    {
        return arrow::Status::Invalid("Bad footer info");
    }
    // Restrict our open file to just the section described by file_info:
    auto sub_file = std::make_shared<SubFile>(
        file_info.file, file_info.file_start_offset, file_info.file_length);
    ARROW_RETURN_NOT_OK(sub_file->Seek(0));
    return sub_file;
}

/// \brief Open everything in \p file from \p offset to the end of the file as a SubFile.
///
/// The returned sub file is positioned at its start. An \p offset beyond the end of the
/// file is rejected by that initial seek.
inline arrow::Result<std::shared_ptr<SubFile>> open_sub_file(
    std::shared_ptr<arrow::io::RandomAccessFile> const & file,
    std::size_t offset)
{
    if (file == nullptr) {
        return arrow::Status::Invalid("Failed to open file from footer");
    }

    ARROW_ASSIGN_OR_RAISE(auto const total_size, file->GetSize());

    // The view covers whatever follows `offset` in the file.
    auto const trailing_length = total_size - offset;
    auto sub_file = std::make_shared<SubFile>(file, offset, trailing_length);
    ARROW_RETURN_NOT_OK(sub_file->Seek(0));
    return sub_file;
}

// Selects whether write_file() deletes the source file after copying it into the combined file
// (CleanupOriginalFile) or leaves it on disk.
// NOTE: `LeaveOrignalFile` is misspelled ("Original"); it is kept because renaming the
// enumerator would break existing users.
enum class SubFileCleanup { CleanupOriginalFile, LeaveOrignalFile };

/// \brief Append a region of another file to \p file and report where it was placed.
///
/// \param pool          Memory pool used for the read buffers.
/// \param file          Destination stream; data is appended at its current position.
/// \param file_location Path, start offset and size of the source region to copy.
/// \param cleanup_mode  Whether the source file is deleted once the copy has finished.
/// \returns The start offset and length of the copied data within \p file. Fails with IOError if
///          the source ends before `file_location.size` bytes could be read.
inline arrow::Result<combined_file_utils::FileInfo> write_file(
    arrow::MemoryPool * pool,
    std::shared_ptr<arrow::io::FileOutputStream> const & file,
    FileLocation const & file_location,
    SubFileCleanup cleanup_mode)
{
    combined_file_utils::FileInfo table_data;
    // Record file start location in bytes within the main file:
    ARROW_ASSIGN_OR_RAISE(table_data.file_start_offset, file->Tell());

    {
        // Stream the source region into the main file. The source handle lives in this scope so
        // it is closed again before the file is (optionally) deleted below.
        ARROW_ASSIGN_OR_RAISE(
            auto source_file_in, arrow::io::ReadableFile::Open(file_location.file_path, pool));
        ARROW_RETURN_NOT_OK(source_file_in->Seek(file_location.offset));

        std::int64_t const total_bytes = static_cast<std::int64_t>(file_location.size);
        std::int64_t const target_chunk_size = 10 * 1024 * 1024;  // Read in 10MB of data at a time
        std::int64_t copied_bytes = 0;
        while (copied_bytes < total_bytes) {
            std::int64_t const to_read =
                std::min<std::int64_t>(total_bytes - copied_bytes, target_chunk_size);
            ARROW_ASSIGN_OR_RAISE(auto const read_buffer, source_file_in->Read(to_read));

            // A zero length read means the source ended early. Without this check the loop would
            // never make progress and spin forever on a truncated source file.
            if (read_buffer->size() == 0) {
                return arrow::Status::IOError(
                    "Unexpected end of file while copying sub file: expected ",
                    total_bytes,
                    " bytes but only found ",
                    copied_bytes);
            }

            copied_bytes += read_buffer->size();
            ARROW_RETURN_NOT_OK(file->Write(read_buffer));
        }

        // Store the written length for later reading:
        ARROW_ASSIGN_OR_RAISE(table_data.file_length, file->Tell());
        table_data.file_length -= table_data.file_start_offset;
    }

    if (cleanup_mode == SubFileCleanup::CleanupOriginalFile) {
        // Clean up the temporary source file:
        ARROW_ASSIGN_OR_RAISE(
            auto arrow_path,
            ::arrow::internal::PlatformFilename::FromString(file_location.file_path));
        ARROW_RETURN_NOT_OK(arrow::internal::DeleteFile(arrow_path));
    }

    return table_data;
}

/// \brief Copy a sub file into \p file with write_file(), then pad the output to 8 bytes and
///        append \p section_marker.
///
/// \returns The location reported by write_file(); it is captured before the padding and the
///          marker are written.
inline arrow::Result<combined_file_utils::FileInfo> write_file_and_marker(
    arrow::MemoryPool * pool,
    std::shared_ptr<arrow::io::FileOutputStream> const & file,
    FileLocation const & file_location,
    SubFileCleanup cleanup_mode,
    Uuid const & section_marker)
{
    // Copy the payload first and remember where it ended up.
    ARROW_ASSIGN_OR_RAISE(
        auto written_section, write_file(pool, file, file_location, cleanup_mode));

    // Align the output to an 8 byte boundary...
    ARROW_RETURN_NOT_OK(combined_file_utils::pad_file(file, 8));
    // ...and terminate the section with its marker.
    ARROW_RETURN_NOT_OK(combined_file_utils::write_section_marker(file, section_marker));

    return written_section;
}

}}  // namespace pod5::combined_file_utils


================================================
FILE: c++/pod5_format/internal/linux_output_stream.h
================================================
#pragma once

#include "pod5_format/file_output_stream.h"
#include "pod5_format/internal/tracing/tracing.h"
#include "pod5_format/io_manager.h"

#include <arrow/buffer.h>
#include <arrow/util/future.h>
#include <gsl/gsl-lite.hpp>

#include <condition_variable>
#include <deque>

#ifdef __linux__
#include <fcntl.h>
#include <unistd.h>
#endif

namespace pod5 {

namespace {
// Number of bytes requested from fallocate() each time more file space is reserved:
// 50 * 256 * IOManager::Alignment, i.e. 50MiB with the 4096 byte alignment.
constexpr size_t fallocate_chunk = 50 * 256 * IOManager::Alignment;  // 50MB
}  // namespace

#ifdef __linux__
/// \brief Output stream that stages data in an aligned buffer and writes it via an IOManager.
///
/// Incoming bytes are collected in an AlignedBuffer and handed to the IOManager as writes whose
/// size is a multiple of IOManager::Alignment, each with an explicit file offset. File space is
/// reserved ahead of the data with fallocate(), and Close() truncates the file back to the number
/// of bytes actually written. When `keep_file_open` is false the descriptor is only held open
/// while writes are outstanding and is re-opened on demand.
class LinuxOutputStream : public FileOutputStream {
    // Tag type: the constructor must be public for std::make_shared, but only code inside this
    // class can name PrivateDummy, so instances can only be created through make().
    struct PrivateDummy {};

public:
    /// \brief Open (creating it if needed) \p file_path and wrap it in a stream.
    ///
    /// \param file_path               File to write to.
    /// \param io_manager              Manager used to allocate buffers and perform writes.
    /// \param write_chunk_size        Size of the staging buffer, in bytes.
    /// \param use_directio            Open the file with O_DIRECT.
    /// \param use_syncio              Open the file with O_SYNC.
    /// \param flush_on_batch_complete Flush buffered data on every batch_complete() call.
    /// \param keep_file_open          Keep the descriptor open between writes.
    /// \returns The stream, or Invalid if the file could not be opened.
    static arrow::Result<std::shared_ptr<LinuxOutputStream>> make(
        std::string const & file_path,
        std::shared_ptr<IOManager> const & io_manager,
        std::size_t write_chunk_size,
        bool use_directio,
        bool use_syncio,
        bool flush_on_batch_complete,
        bool keep_file_open = true)
    {
        auto flags = O_RDWR | O_CREAT;
        if (use_directio) {
            flags |= O_DIRECT;
        }

        if (use_syncio) {
            flags |= O_SYNC;
        }

        auto const initial_file_descriptor = open(file_path.c_str(), flags, 0644);
        if (initial_file_descriptor < 0) {
            return arrow::Status::Invalid("Failed to open file");
        }

        return std::make_shared<LinuxOutputStream>(
            file_path,
            initial_file_descriptor,
            flags,
            io_manager,
            write_chunk_size,
            keep_file_open,
            flush_on_batch_complete,
            PrivateDummy{});
    }

    // Errors cannot be reported from a destructor; call Close() explicitly to observe them.
    ~LinuxOutputStream() { (void)Close(); }

    /// \brief Flush all data, wait for outstanding writes, truncate the file to the number of
    ///        bytes written and close it.
    ///
    /// Calling Close() again after a successful close (or after Abort()) is a no-op. Previously a
    /// second call - for example the one made by the destructor - re-opened the path with O_CREAT
    /// and truncated it, which could recreate a file that had been deleted in the meantime.
    arrow::Status Close() override
    {
        if (m_closed) {
            return arrow::Status::OK();
        }

        // flush all output
        ARROW_RETURN_NOT_OK(Flush());

        while (!m_queued_writes.empty()) {
            ARROW_RETURN_NOT_OK(process_queued_writes());

            if (!m_queued_writes.empty()) {
                ARROW_RETURN_NOT_OK(m_io_manager->wait_for_event(std::chrono::seconds(1)));
            }
        }

        std::lock_guard<std::mutex> l{m_file_handle_mutex};
        ARROW_ASSIGN_OR_RAISE(auto const file_descriptor, get_or_open_fd(l));

        // truncate excess data (alignment padding and space reserved by fallocate)
        if (::ftruncate(file_descriptor, m_bytes_written) < 0) {
            return arrow::Status::IOError("Failed to truncate file");
        }

        // and close stream; the descriptor is released even if close() reports an error, so the
        // stream counts as closed either way.
        auto const close_status = close_fd(l, true);
        m_closed = true;
        return close_status;
    }

    arrow::Future<> CloseAsync() override { return Close(); }

    /// \brief Close the descriptor without flushing buffered data or truncating the file.
    ///
    /// The stream is marked closed, so the destructor does not flush afterwards.
    arrow::Status Abort() override
    {
        std::lock_guard<std::mutex> l{m_file_handle_mutex};
        m_closed = true;
        return close_fd(l, true);
    }

    /// Number of bytes written so far, relative to the offset set by set_file_start_offset().
    arrow::Result<int64_t> Tell() const override { return m_bytes_written - m_file_start_offset; }

    /// True once Close() has completed or Abort() has been called. This is tracked separately
    /// from the descriptor, which is also -1 between writes when `keep_file_open` is false.
    bool closed() const override { return m_closed; }

    /// \brief Append \p nbytes bytes from \p data to the stream.
    ///
    /// Data is staged in the aligned buffer; each time the buffer fills, its aligned portion is
    /// submitted to the IOManager.
    arrow::Status Write(void const * data, int64_t nbytes) override
    {
        if (nbytes < 0) {
            return arrow::Status::Invalid("Cannot write a negative number of bytes");
        }

        ARROW_RETURN_NOT_OK(allocate_file_space(nbytes));

        auto remaining_data = gsl::make_span(reinterpret_cast<std::uint8_t const *>(data), nbytes);
        while (!remaining_data.empty()) {
            ARROW_ASSIGN_OR_RAISE(
                remaining_data, m_aligned_buffer.consume_until_full(remaining_data));

            if (m_aligned_buffer.is_full()) {
                ARROW_RETURN_NOT_OK(flush_writes(FlushMode::AlignedWrites));
            }
        }

        m_bytes_written += nbytes;

        return arrow::Status::OK();
    }

    /// \brief Append the contents of \p data to the stream.
    arrow::Status Write(std::shared_ptr<arrow::Buffer> const & data) override
    {
        if (!data) {
            return arrow::Status::Invalid("Cannot write a null buffer");
        }

        // Qualified call: always use this class's raw-pointer implementation, so the two
        // overloads cannot diverge.
        return LinuxOutputStream::Write(data->data(), data->size());
    }

    /// Flush buffered data if the stream was configured to flush on batch completion.
    arrow::Status batch_complete() override
    {
        if (m_flush_on_batch_complete) {
            return flush_writes(FlushMode::AllWrites);
        }
        return arrow::Status::OK();
    }

    /// \brief Submit all buffered data and fsync the file if a descriptor is currently open.
    ///
    /// NOTE(review): when `keep_file_open` is false, flush_writes() may already have closed the
    /// descriptor, in which case no fsync is issued here - confirm whether that is intended.
    arrow::Status Flush() override
    {
        ARROW_RETURN_NOT_OK(flush_writes(FlushMode::AllWrites));

        std::lock_guard<std::mutex> l{m_file_handle_mutex};
        if (m_file_descriptor < 0) {
            return arrow::Status::OK();
        }

        if (fsync(m_file_descriptor) < 0) {
            return arrow::Status::IOError("Error flushing file");
        }

        return arrow::Status::OK();
    }

    void set_file_start_offset(std::size_t val) override { m_file_start_offset = val; }

    void set_flush_on_batch_complete(bool flush_on_batch_complete)
    {
        m_flush_on_batch_complete = flush_on_batch_complete;
    }

    /// Use make() instead; the PrivateDummy parameter prevents construction from outside.
    LinuxOutputStream(
        std::string const & file_path,
        int initial_file_descriptor,
        int flags,
        std::shared_ptr<IOManager> const & io_manager,
        std::size_t write_chunk_size,
        bool keep_file_open,
        bool flush_on_batch_complete,
        PrivateDummy)
    : m_file_path(file_path)
    , m_flags(flags)
    , m_file_descriptor(initial_file_descriptor)
    , m_keep_file_open(keep_file_open)
    , m_aligned_buffer(write_chunk_size, io_manager)
    , m_io_manager(io_manager)
    , m_flush_on_batch_complete(flush_on_batch_complete)
    {
        // The initial open only creates the file; it is re-opened on demand when writing.
        if (!m_keep_file_open) {
            close(m_file_descriptor);
            m_file_descriptor = -1;
        }
    }

protected:
    // AllWrites submits everything buffered (padding the write up to the alignment);
    // AlignedWrites submits only the largest aligned prefix of the buffered data.
    enum class FlushMode { AllWrites, AlignedWrites };

    /// Staging buffer that accumulates bytes until `capacity` bytes are available to write.
    class AlignedBuffer {
    public:
        AlignedBuffer(std::size_t capacity, std::shared_ptr<IOManager> const & io_manager)
        : m_io_manager(io_manager)
        , m_capacity(capacity)
        {
        }

        // Copy input span to the end of the buffer until this buffer is full.
        //
        // Return any remaining buffer.
        arrow::Result<gsl::span<std::uint8_t const>> consume_until_full(
            gsl::span<std::uint8_t const> input)
        {
            ARROW_RETURN_NOT_OK(ensure_next_write());

            auto & buffer = m_next_write->get_buffer();
            assert((std::size_t)buffer.capacity() >= m_capacity);

            // Fill only up to the logical capacity. The allocation itself may be larger than
            // requested; filling up to the allocated capacity would push the size past
            // m_capacity, so the buffer would never be reported as full and never be flushed.
            auto const used_bytes = (std::size_t)buffer.size();
            std::size_t const remaining_buffer_bytes =
                used_bytes < m_capacity ? m_capacity - used_bytes : 0;
            auto const to_copy = std::min<std::size_t>(input.size(), remaining_buffer_bytes);

            std::copy(
                input.begin(), input.begin() + to_copy, buffer.mutable_data() + buffer.size());
            ARROW_RETURN_NOT_OK(buffer.Resize(buffer.size() + to_copy, false));

            return input.subspan(to_copy);
        }

        // Find if the buffer is full (size has reached m_capacity)
        bool is_full() const
        {
            if (!m_next_write) {
                return false;
            }

            return (std::size_t)m_next_write->get_buffer().size() >= m_capacity;
        }

        // Release everything buffered as one write, padded up to the write alignment.
        //
        // out_aligned_write_size receives the size of the aligned prefix of the real data. The
        // unaligned tail is written as part of the padded block but is also carried over into the
        // next buffer, so it is written again (at the same file offset) together with later data.
        arrow::Result<std::shared_ptr<QueuedWrite>> release_all_writes_and_align(
            std::size_t * out_aligned_write_size)
        {
            ARROW_RETURN_NOT_OK(ensure_next_write());

            // Allocate the replacement first so a failed allocation cannot drop buffered data.
            ARROW_ASSIGN_OR_RAISE(auto next_write, m_io_manager->allocate_new_write(m_capacity));

            auto result_write = std::move(m_next_write);
            m_next_write = std::move(next_write);
            auto & result_write_buffer = result_write->get_buffer();
            auto & next_write_buffer = m_next_write->get_buffer();

            auto const unaligned_size = (std::size_t)result_write_buffer.size();
            auto const aligned_size = aligned_write_size(unaligned_size);
            *out_aligned_write_size = aligned_size;

            // Carry the unaligned tail over into the next buffer.
            std::copy(
                result_write_buffer.data() + aligned_size,
                result_write_buffer.data() + unaligned_size,
                next_write_buffer.mutable_data());
            ARROW_RETURN_NOT_OK(next_write_buffer.Resize(unaligned_size - aligned_size, false));

            // Ensure the result write buffer is aligned to our write alignment.
            auto const padded_size = ((unaligned_size + IOManager::Alignment - 1)
                                      / IOManager::Alignment)
                                     * IOManager::Alignment;
            ARROW_RETURN_NOT_OK(result_write_buffer.Resize(padded_size, false));
            // Zero the padding so uninitialised memory is never written to disk.
            std::fill(
                result_write_buffer.mutable_data() + unaligned_size,
                result_write_buffer.mutable_data() + padded_size,
                std::uint8_t{0});
            assert(result_write_buffer.size() % IOManager::Alignment == 0);

            result_write->set_state(QueuedWrite::WriteState::ReadyForWrite);
            return result_write;
        }

        // Release the largest aligned prefix of the buffered data as a write; any unaligned tail
        // is moved to the start of the next buffer.
        arrow::Result<std::shared_ptr<QueuedWrite>> release_aligned_writes()
        {
            ARROW_RETURN_NOT_OK(ensure_next_write());

            // Allocate the replacement first so a failed allocation cannot drop buffered data.
            ARROW_ASSIGN_OR_RAISE(auto next_write, m_io_manager->allocate_new_write(m_capacity));

            auto result_write = std::move(m_next_write);
            m_next_write = std::move(next_write);
            auto & result_write_buffer = result_write->get_buffer();
            auto & next_write_buffer = m_next_write->get_buffer();

            // Capture the sizes before resizing anything: computing the tail length after the
            // released buffer has been shrunk always yields zero and silently drops the tail.
            auto const unaligned_size = (std::size_t)result_write_buffer.size();
            auto const aligned_size = aligned_write_size(unaligned_size);
            auto const carried_size = unaligned_size - aligned_size;

            std::copy(
                result_write_buffer.data() + aligned_size,
                result_write_buffer.data() + unaligned_size,
                next_write_buffer.mutable_data());
            ARROW_RETURN_NOT_OK(next_write_buffer.Resize(carried_size, false));
            ARROW_RETURN_NOT_OK(result_write_buffer.Resize(aligned_size, false));

            result_write->set_state(QueuedWrite::WriteState::ReadyForWrite);
            return result_write;
        }

    private:
        // Round input_size down to a multiple of the write alignment.
        std::size_t aligned_write_size(std::size_t input_size) const
        {
            return (input_size / IOManager::Alignment) * IOManager::Alignment;
        }

        // Lazily allocate the buffer that new data is staged into.
        arrow::Status ensure_next_write()
        {
            if (m_next_write) {
                return arrow::Status::OK();
            }

            ARROW_ASSIGN_OR_RAISE(m_next_write, m_io_manager->allocate_new_write(m_capacity));
            assert((std::size_t)m_next_write->get_buffer().capacity() >= m_capacity);
            return arrow::Status::OK();
        }

        std::shared_ptr<QueuedWrite> m_next_write;
        std::shared_ptr<IOManager> m_io_manager;
        std::size_t m_capacity;
    };

    // Return the open descriptor, re-opening the file first if it is currently closed.
    // The lock parameter documents that m_file_handle_mutex must be held by the caller.
    arrow::Result<int> get_or_open_fd([[maybe_unused]] std::lock_guard<std::mutex> & lock)
    {
        if (m_file_descriptor >= 0) {
            return m_file_descriptor;
        }

        m_file_descriptor = open(m_file_path.c_str(), m_flags, 0644);
        if (m_file_descriptor < 0) {
            return arrow::Status::IOError("Failed to open file for writing");
        }
        return m_file_descriptor;
    }

    // Close the descriptor unless the stream keeps its file open (`force` overrides that).
    // Closing when no descriptor is open is a successful no-op.
    arrow::Status close_fd([[maybe_unused]] std::lock_guard<std::mutex> & lock, bool force = false)
    {
        if (m_keep_file_open && !force) {
            return arrow::Status::OK();
        }

        if (m_file_descriptor < 0) {
            // Nothing is open (e.g. Abort() between writes); close(-1) would report an error.
            return arrow::Status::OK();
        }

        // Forget the descriptor before closing it: on Linux it is released even when close()
        // reports an error, so it must not be used (or closed) again.
        int const file_descriptor = m_file_descriptor;
        m_file_descriptor = -1;
        if (close(file_descriptor) != 0) {
            return arrow::Status::IOError("Error closing file");
        }
        return arrow::Status::OK();
    }

    // Release buffered data according to flush_mode and submit it to the IOManager.
    arrow::Status flush_writes(FlushMode flush_mode)
    {
        std::size_t write_offset{};
        std::shared_ptr<QueuedWrite> released_data;

        if (flush_mode == FlushMode::AllWrites) {
            std::size_t aligned_write_size = 0;
            ARROW_ASSIGN_OR_RAISE(
                released_data, m_aligned_buffer.release_all_writes_and_align(&aligned_write_size));
            write_offset = m_bytes_submitted_to_manager;
            // Only the aligned prefix counts as submitted; the tail is written again later.
            m_bytes_submitted_to_manager += aligned_write_size;
        } else if (flush_mode == FlushMode::AlignedWrites) {
            ARROW_ASSIGN_OR_RAISE(released_data, m_aligned_buffer.release_aligned_writes());
            write_offset = m_bytes_submitted_to_manager;
            m_bytes_submitted_to_manager += released_data->get_buffer().size();
        } else {
            assert(false);
            return arrow::Status::Invalid("Invalid FlushMode Passed.");
        }

        assert(released_data->get_buffer().size() % IOManager::Alignment == 0);

        if (released_data->get_buffer().size() == 0) {
            return arrow::Status::OK();
        }

        std::lock_guard<std::mutex> lock(m_file_handle_mutex);
        ARROW_ASSIGN_OR_RAISE(auto const file_descriptor, get_or_open_fd(lock));
        released_data->prepare_for_write(file_descriptor, write_offset);

        m_queued_writes.emplace_back(released_data);
        auto const write_status = m_io_manager->write_buffer(std::move(released_data));
        if (!write_status.ok()) {
            // A write that was rejected never reaches the Completed state. Leaving it queued
            // would make Close() (and therefore the destructor) wait for it forever.
            m_queued_writes.pop_back();
            return write_status;
        }

        ARROW_RETURN_NOT_OK(process_queued_writes());

        if (m_queued_writes.empty()) {
            return close_fd(lock);
        } else {
            // If we have queued writes, we keep the file open.
            return arrow::Status::OK();
        }
    }

    // Hand every completed write back to the IOManager and drop it from the queue.
    arrow::Status process_queued_writes()
    {
        for (auto it = m_queued_writes.begin(); it != m_queued_writes.end();) {
            if ((*it)->state() == QueuedWrite::WriteState::Completed) {
                ARROW_RETURN_NOT_OK(m_io_manager->return_used_write(std::move(*it)));
                it = m_queued_writes.erase(it);
            } else {
                ++it;
            }
        }

        return arrow::Status::OK();
    }

    // Reserve file space (in multiples of fallocate_chunk) so that a write of new_write_size
    // bytes at the current position lands in pre-allocated space.
    arrow::Status allocate_file_space(std::size_t new_write_size)
    {
        auto const new_total_size = m_bytes_written + new_write_size;
        if (new_total_size <= m_fallocate_offset) {
            return arrow::Status::OK();
        }

        std::lock_guard<std::mutex> lock(m_file_handle_mutex);
        ARROW_ASSIGN_OR_RAISE(auto const file_descriptor, get_or_open_fd(lock));

        // Reserve starting at the end of what is already reserved, and enough whole chunks to
        // cover the new write. Advancing the offset before the call would skip the first chunk
        // entirely, and a single chunk may not cover a large write.
        auto const bytes_needed = new_total_size - m_fallocate_offset;
        auto const chunks_needed = (bytes_needed + fallocate_chunk - 1) / fallocate_chunk;
        auto const bytes_to_reserve = chunks_needed * fallocate_chunk;

        // If this fails, we will just write less optimally, so we ignore the result.
        (void)::fallocate(file_descriptor, 0, m_fallocate_offset, bytes_to_reserve);
        m_fallocate_offset += bytes_to_reserve;

        return arrow::Status::OK();
    }

    std::string m_file_path;
    int m_flags;
    std::mutex m_file_handle_mutex;
    int m_file_descriptor;
    bool m_keep_file_open{false};

    AlignedBuffer m_aligned_buffer;
    std::vector<std::shared_ptr<QueuedWrite>> m_queued_writes;
    std::shared_ptr<IOManager> m_io_manager;
    std::size_t m_fallocate_offset{0};
    std::size_t m_file_start_offset{0};
    std::size_t m_bytes_written{0};
    std::size_t m_bytes_submitted_to_manager{0};
    bool m_flush_on_batch_complete;
    // Set once Close() has completed or Abort() was called.
    bool m_closed{false};
};
#endif

}  // namespace pod5


================================================
FILE: c++/pod5_format/internal/tracing/tracing.h
================================================
#pragma once

#define POD5_TRACE_FUNCTION()


================================================
FILE: c++/pod5_format/io_manager.cpp
================================================
#include "pod5_format/io_manager.h"

#ifdef __linux__
#include <unistd.h>
#endif

namespace pod5 {

#ifdef __linux__
/// IOManager that performs every write synchronously on the calling thread and keeps a small
/// cache of used buffers for reuse.
class IOManagerSyncImpl : public IOManager {
public:
    IOManagerSyncImpl(arrow::MemoryPool * memory_pool) : m_memory_pool(memory_pool) {}

    /// Return an empty write whose buffer can hold at least \p capacity bytes, reusing a cached
    /// buffer when one is available.
    arrow::Result<std::shared_ptr<QueuedWrite>> allocate_new_write(std::size_t capacity) override
    {
        if (m_queued_writes.size()) {
            auto new_write = m_queued_writes.back();
            m_queued_writes.pop_back();
            ARROW_RETURN_NOT_OK(new_write->reset_queued_write());
            ARROW_RETURN_NOT_OK(new_write->get_buffer().Reserve(capacity));
            assert((std::size_t)new_write->get_buffer().capacity() >= capacity);
            return new_write;
        }

        ARROW_ASSIGN_OR_RAISE(
            std::unique_ptr<arrow::ResizableBuffer> buffer,
            arrow::AllocateResizableBuffer(capacity, IOManager::Alignment, m_memory_pool));
        // The buffer is allocated at full capacity but starts out logically empty.
        ARROW_RETURN_NOT_OK(buffer->Resize(0, false));
        assert((std::size_t)buffer->capacity() >= capacity);
        assert((std::size_t)buffer->size() == 0);
        return std::make_shared<QueuedWrite>(std::move(buffer));
    }

    /// Take back a finished write; it is cached for reuse unless the cache already holds
    /// CachedBufferCount entries, in which case it is dropped.
    arrow::Status return_used_write(std::shared_ptr<QueuedWrite> && used_write) override
    {
        if (m_queued_writes.size() < CachedBufferCount) {
            m_queued_writes.push_back(std::move(used_write));
        }
        used_write.reset();
        return arrow::Status::OK();
    }

    /// \brief Write the whole buffer of \p data at its prepared descriptor and offset.
    ///
    /// The write is marked Completed only once every byte has been written; on failure an IOError
    /// is returned and the state is left unchanged.
    arrow::Status write_buffer(std::shared_ptr<QueuedWrite> && data) override
    {
        if (lseek(data->file_descriptor(), data->file_offset(), SEEK_SET) < 0) {
            return arrow::Status::IOError("Error seeking in file");
        }

        // write() may transfer fewer bytes than requested or be interrupted by a signal, so keep
        // going until the whole buffer is on its way to the file. Treating a short write as
        // success would silently lose the remaining bytes.
        auto const * next_byte = data->get_buffer().data();
        auto bytes_remaining = static_cast<std::size_t>(data->get_buffer().size());
        while (bytes_remaining > 0) {
            auto const written = write(data->file_descriptor(), next_byte, bytes_remaining);
            if (written < 0) {
                if (errno == EINTR) {
                    continue;
                }
                return arrow::Status::IOError(
                    "Error writing to file: ",
                    errno,
                    " desc: ",
                    data->file_descriptor(),
                    " offset: ",
                    data->file_offset(),
                    " size: ",
                    data->get_buffer().size());
            }
            if (written == 0) {
                // No progress and no error code: give up rather than loop forever.
                return arrow::Status::IOError(
                    "Error writing to file: no bytes written, desc: ",
                    data->file_descriptor(),
                    " offset: ",
                    data->file_offset(),
                    " size: ",
                    data->get_buffer().size());
            }

            next_byte += written;
            bytes_remaining -= static_cast<std::size_t>(written);
        }

        data->set_state(QueuedWrite::WriteState::Completed);

        return {};
    }

private:
    arrow::MemoryPool * m_memory_pool;
    // Cache of returned writes available for reuse by allocate_new_write().
    std::vector<std::shared_ptr<QueuedWrite>> m_queued_writes;
};

/// Create the synchronous IOManager implementation, which allocates its buffers from
/// \p memory_pool.
arrow::Result<std::shared_ptr<IOManager>> make_sync_io_manager(arrow::MemoryPool * memory_pool)
{
    std::shared_ptr<IOManager> sync_manager = std::make_shared<IOManagerSyncImpl>(memory_pool);
    return sync_manager;
}
#endif

}  // namespace pod5


================================================
FILE: c++/pod5_format/io_manager.h
================================================
#pragma once

#include <arrow/buffer.h>
#include <arrow/result.h>
#include <arrow/status.h>

#ifdef __linux__
#include <sys/uio.h>
#endif

#include <atomic>
#include <cassert>
#include <chrono>
#include <memory>

namespace pod5 {

#ifdef __linux__
/// A buffer plus the bookkeeping (target descriptor, file offset, iovec and state) needed to
/// write it to a file.
class QueuedWrite {
public:
    enum class WriteState { Empty, ReadyForWrite, InFlight, Completed };

    QueuedWrite() = default;

    QueuedWrite(std::unique_ptr<arrow::ResizableBuffer> && buffer) : m_buffer(std::move(buffer)) {}

    /// Clear the target information and empty the buffer so this write can be reused.
    /// Must not be called while the write is ready for writing or in flight.
    arrow::Status reset_queued_write()
    {
        assert(m_state != WriteState::ReadyForWrite);
        assert(m_state != WriteState::InFlight);

        m_file_descriptor = -1;
        m_file_offset = -1;
        m_iovec = {};
        m_state = WriteState::Empty;

        return m_buffer->Resize(0, false);
    }

    /// Record where the buffer should be written and mark the write as ready.
    void prepare_for_write(int file_descriptor, std::uint64_t offset)
    {
        m_file_descriptor = file_descriptor;
        m_file_offset = offset;

        // Describe the buffer's current contents for vectored IO.
        m_iovec.iov_base = m_buffer->mutable_data();
        m_iovec.iov_len = static_cast<std::size_t>(m_buffer->size());

        set_state(WriteState::ReadyForWrite);
    }

    arrow::ResizableBuffer & get_buffer() { return *m_buffer; }

    arrow::Buffer const & get_buffer() const { return *m_buffer; }

    int file_descriptor() const { return m_file_descriptor; }

    std::uint64_t file_offset() const { return m_file_offset; }

    iovec * get_iovec_for_buffer() { return &m_iovec; }

    WriteState state() const { return m_state; }

    void set_state(WriteState state) { m_state = state; }

private:
    std::unique_ptr<arrow::ResizableBuffer> m_buffer;
    std::uint64_t m_file_offset{(std::uint64_t)-1};
    iovec m_iovec{};
    int m_file_descriptor{-1};
    WriteState m_state{WriteState::Empty};
};
#endif

// Interface used by output streams to obtain write buffers and to perform the writes.
// The write-related members are only declared on Linux.
class IOManager {
public:
    constexpr static size_t Alignment = 4096;  // buffer alignment (for block devices)
    // Maximum number of used buffers an implementation keeps around for reuse.
    constexpr static size_t CachedBufferCount = 5;

    virtual ~IOManager() = default;

#ifdef __linux__
    // Obtain a write whose buffer can hold at least `capacity` bytes.
    virtual arrow::Result<std::shared_ptr<QueuedWrite>> allocate_new_write(
        std::size_t capacity) = 0;
    // Hand a write back to the manager once the caller has finished with it.
    virtual arrow::Status return_used_write(std::shared_ptr<QueuedWrite> && used_write) = 0;

    // Submit a prepared write.
    virtual arrow::Status write_buffer(std::shared_ptr<QueuedWrite> && data) = 0;

    // Wait for outstanding work to progress. The default implementation ignores `timeout` and
    // returns success immediately.
    virtual arrow::Status wait_for_event(std::chrono::nanoseconds timeout) { return {}; }
#endif
};

#ifdef __linux__
arrow::Result<std::shared_ptr<IOManager>> make_sync_io_manager(
    arrow::MemoryPool * memory_pool = arrow::default_memory_pool());
#endif

}  // namespace pod5


================================================
FILE: c++/pod5_format/memory_pool.cpp
================================================
#include "memory_pool.h"

#ifdef _WIN32
#include <windows.h>
#elif !defined(__FreeBSD__)
#include <unistd.h>
#endif

namespace {

// Referenced from the jemalloc source:
// https://github.com/jemalloc/jemalloc/blob/b82333fdec6e5833f88780fcf1fc50b799268e1b/src/pages.c#L596C1-L616C2
// Query the operating system's memory page size, in bytes.
//
// If the size cannot be determined, a deliberately large page size (64KiB) is reported.
size_t os_page_detect(void)
{
#ifdef _WIN32
    SYSTEM_INFO si;
    GetSystemInfo(&si);
    return si.dwPageSize;
#elif defined(__FreeBSD__)
    /*
     * This returns the value obtained from
     * the auxv vector, avoiding a syscall.
     */
    return getpagesize();
#else
    long result = sysconf(_SC_PAGESIZE);
    if (result == -1) {
        // Default to safe, large page size. Page sizes are powers of two, so this is
        // 4096 * 16 (64KiB) rather than 4095 * 16.
        return 4096 * 16;
    }
    return (size_t)result;
#endif
}

}  // namespace

namespace pod5 {

// Pick the memory pool used by default: the system pool when the OS page size is larger than
// 4096 bytes, otherwise arrow's own default pool.
arrow::MemoryPool * default_memory_pool()
{
    constexpr size_t largest_regular_page_size = 4096;

    bool const has_large_pages = os_page_detect() > largest_regular_page_size;
    return has_large_pages ? arrow::system_memory_pool() : arrow::default_memory_pool();
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/memory_pool.h
================================================
#pragma once
#include <arrow/memory_pool.h>

namespace pod5 {

/// \brief Find a memory pool that should be used by default when opening or creating a pod5 file.
/// \note This function differs from the arrow equivalent by not using jemalloc on systems with large
///       pages, which jemalloc does not support.
arrow::MemoryPool * default_memory_pool();

}  // namespace pod5


================================================
FILE: c++/pod5_format/migration/migration.cpp
================================================
#include "pod5_format/migration/migration.h"

#include <random>

namespace pod5 {

// Set once the atexit handler has been installed, so that it is only registered a single time.
static bool registered_delete_at_exit_called = false;
// Directories whose deletion has been deferred until process exit.
std::vector<arrow::internal::PlatformFilename> registered_delete_at_exit_paths;

// Remember `path` so its directory tree is deleted when the process exits. The exit handler is
// installed on the first call and warns on stderr about directories it could not remove.
void register_delete_at_exit(arrow::internal::PlatformFilename const & path)
{
    registered_delete_at_exit_paths.push_back(path);

    if (registered_delete_at_exit_called) {
        // The handler is already installed and will pick up the path added above.
        return;
    }

    std::atexit([] {
        std::size_t failed_count = 0;
        for (auto const & pending_path : registered_delete_at_exit_paths) {
            if (!::arrow::internal::DeleteDirTree(pending_path).ok()) {
                ++failed_count;
            }
        }

        if (failed_count > 0) {
            std::cerr << "Warning: Failed to remove " << failed_count
                      << " temporary migration directories at exit.\n";
        }
    });
    registered_delete_at_exit_called = true;
}

// Create a new directory named ".tmp_<suffix>_<random number>" and wrap it in a TemporaryDir.
// Up to five randomly generated names are tried before giving up with an Invalid status.
Result<std::unique_ptr<TemporaryDir>> MakeTmpDir(char const * suffix)
{
    using RandomEngine = std::default_random_engine;
    constexpr std::uint32_t max_attempts = 5;

    RandomEngine name_generator(
        static_cast<RandomEngine::result_type>(arrow::internal::GetRandomSeed()));
    std::string const name_prefix = std::string{".tmp_"} + suffix + "_";

    for (std::uint32_t attempt = 0; attempt < max_attempts; ++attempt) {
        std::string const candidate_path = name_prefix + std::to_string(name_generator());

        ARROW_ASSIGN_OR_RAISE(
            auto filename, arrow::internal::PlatformFilename::FromString(candidate_path));
        // Only a directory that was newly created by this call is used.
        ARROW_ASSIGN_OR_RAISE(auto created, CreateDir(filename));
        if (created) {
            return std::make_unique<TemporaryDir>(std::move(filename));
        }
    }

    return arrow::Status::Invalid("Failed to make temporary directory");
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/migration/migration.h
================================================
#pragma once

#include "pod5_format/internal/combined_file_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/schema_utils.h"

#include <arrow/util/io_util.h>

#include <iostream>

namespace pod5 {

void register_delete_at_exit(arrow::internal::PlatformFilename const & path);

/// Owns a directory on disk and deletes its whole tree when destroyed.
class TemporaryDir {
public:
    // A named rvalue reference is an lvalue, so it has to be moved explicitly; otherwise the
    // path would be copied.
    TemporaryDir(arrow::internal::PlatformFilename && path) : m_path(std::move(path)) {}

    ~TemporaryDir() { cleanup(); }

    /// The directory being managed; empty once it has been deleted successfully.
    arrow::internal::PlatformFilename const & path() const { return m_path; }

    /// Delete the directory tree now. If that fails, deletion is deferred to process exit.
    void cleanup()
    {
        if (m_path.ToString().empty()) {
            // Already cleaned up.
            return;
        }

        auto result = ::arrow::internal::DeleteDirTree(m_path);
        if (!result.ok()) {
            // Push the delete of this directory off to exit, when all open file handles should be closed.
            register_delete_at_exit(m_path);
        } else {
            m_path = {};
        }
    }

private:
    arrow::internal::PlatformFilename m_path;
};

Result<std::unique_ptr<TemporaryDir>> MakeTmpDir(char const * suffix);

// Result of a migration step: the (possibly rewritten) footer plus the temporary directories
// that back any files it refers to. Movable but not copyable.
class MigrationResult {
public:
    // Takes a copy of `footer`.
    MigrationResult(combined_file_utils::ParsedFooter const & footer) : m_footer(footer) {}

    MigrationResult(MigrationResult &&) = default;
    MigrationResult & operator=(MigrationResult &&) = default;
    MigrationResult(MigrationResult const &) = delete;
    MigrationResult & operator=(MigrationResult const &) = delete;

    combined_file_utils::ParsedFooter & footer() { return m_footer; }

    combined_file_utils::ParsedFooter const & footer() const { return m_footer; }

    // Tie the lifetime of a temporary directory to this result.
    void add_temp_dir(std::unique_ptr<TemporaryDir> && temp_dir)
    {
        m_temp_dirs.emplace_back(std::move(temp_dir));
    }

private:
    // This is first so we clean it up last, after the
    // footer and any open files it contains is destroyed.
    // (Members are destroyed in reverse order of declaration, so do not reorder these.)
    std::vector<std::unique_ptr<TemporaryDir>> m_temp_dirs;
    combined_file_utils::ParsedFooter m_footer;
};

// Individual migration steps. Each consumes the result of the previous step and returns the
// migrated result; migrate_if_required() chains them based on the version that wrote the file.
arrow::Result<MigrationResult> migrate_v0_to_v1(
    MigrationResult && v0_input,
    arrow::MemoryPool * pool);
arrow::Result<MigrationResult> migrate_v1_to_v2(
    MigrationResult && v1_input,
    arrow::MemoryPool * pool);
arrow::Result<MigrationResult> migrate_v2_to_v3(
    MigrationResult && v2_input,
    arrow::MemoryPool * pool);
arrow::Result<MigrationResult> migrate_v3_to_v4(
    MigrationResult && v3_input,
    arrow::MemoryPool * pool);

// Bring a footer written by `writer_version` up to date by applying, in order, every migration
// step introduced after that version. `source` is currently not used by this function.
inline arrow::Result<MigrationResult> migrate_if_required(
    Version writer_version,
    combined_file_utils::ParsedFooter const & read_footer,
    std::shared_ptr<arrow::io::RandomAccessFile> const & source,
    arrow::MemoryPool * pool)
{
    using MigrationStep =
        arrow::Result<MigrationResult> (*)(MigrationResult &&, arrow::MemoryPool *);

    struct VersionedMigration {
        // Files written by versions older than this need the step applied.
        Version introduced_in;
        MigrationStep apply;
    };

    // Ordered oldest first; each step consumes the output of the one before it.
    VersionedMigration const migrations[] = {
        {Version(0, 0, 24), &migrate_v0_to_v1},  // Added fields for read scaling
        {Version(0, 0, 32), &migrate_v1_to_v2},  // Added num samples field
        {Version(0, 0, 38), &migrate_v2_to_v3},  // Flattening fields
        {Version(0, 3, 30), &migrate_v3_to_v4},
    };

    MigrationResult migrated{read_footer};
    for (auto const & migration : migrations) {
        if (writer_version < migration.introduced_in) {
            ARROW_ASSIGN_OR_RAISE(migrated, migration.apply(std::move(migrated), pool));
        }
    }
    return migrated;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/migration/migration_utils.h
================================================
#pragma once

#include "pod5_format/internal/combined_file_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/schema_metadata.h"

#include <arrow/array.h>
#include <arrow/ipc/reader.h>
#include <arrow/ipc/writer.h>
#include <arrow/util/key_value_metadata.h>

#include <iterator>

namespace pod5 {

/// \brief Build an array of \p row_count elements that all hold \p default_value.
///
/// \tparam T Builder type; it is constructed from the memory pool and must provide
///           `AppendValues(first, last)` and `Finish()`.
/// \tparam U Type of the repeated value.
/// \returns The finished array, or the error reported while appending.
template <typename T, typename U>
arrow::Result<std::shared_ptr<arrow::Array>>
make_filled_array(arrow::MemoryPool * pool, std::size_t row_count, U default_value)
{
    // Minimal iterator to repeat the same value N times.
    // TODO: replace with std::views::repeat in C++23
    struct RepeatIter {
        // These are necessary to make |std::distance| and |std::copy| fast.
        using iterator_category [[maybe_unused]] = std::random_access_iterator_tag;
        using value_type = U const;
        using difference_type = std::int64_t;
        using pointer [[maybe_unused]] = value_type *;
        using reference = value_type &;

        // Position within the virtual sequence; only used for comparison and distance.
        std::size_t m_idx;
        // The value produced at every position.
        value_type m_value;

        constexpr RepeatIter & operator++()
        {
            m_idx++;
            return *this;
        }

        constexpr RepeatIter operator++(int)
        {
            RepeatIter retval = *this;
            m_idx++;
            return retval;
        }

        constexpr bool operator==(RepeatIter const & other) const { return m_idx == other.m_idx; }

        constexpr bool operator!=(RepeatIter const & other) const { return !operator==(other); }

        constexpr difference_type operator-(RepeatIter const & other) const
        {
            return static_cast<difference_type>(m_idx) - static_cast<difference_type>(other.m_idx);
        }

        constexpr reference operator*() const { return m_value; }
    };

    // The half-open range [begin, end) spans exactly row_count positions.
    RepeatIter iter_begin{0, default_value};
    RepeatIter iter_end{row_count, default_value};

    T builder(pool);
    ARROW_RETURN_NOT_OK(builder.AppendValues(iter_begin, iter_end));
    return builder.Finish();
}

/// \brief Store \p array as the column for \p field_name, at the position the field has in
///        \p schema.
///
/// \p columns is grown if it is too short to hold that position. Fails if the field is not part
/// of the schema, or with the error carried by \p array if it does not hold a value.
inline arrow::Status set_column(
    std::shared_ptr<arrow::Schema> const & schema,
    std::vector<std::shared_ptr<arrow::Array>> & columns,
    char const * field_name,
    arrow::Result<std::shared_ptr<arrow::Array>> const & array)
{
    auto const column_index = schema->GetFieldIndex(field_name);
    if (column_index == -1) {
        return arrow::Status::Invalid("Failed to find field '", field_name, "' during migration.");
    }

    // Make sure there is a slot for this column.
    auto const required_columns = static_cast<std::size_t>(column_index) + 1;
    if (columns.size() < required_columns) {
        columns.resize(required_columns);
    }

    ARROW_ASSIGN_OR_RAISE(columns[column_index], array);

    return arrow::Status::OK();
}

/// \brief Copy the column named \p field_name from one set of columns to another.
///
/// The column is looked up by name in both schemas, so it may sit at different positions in the
/// source (`a`) and the destination (`b`). \p columns_b is grown if it is too short.
///
/// \returns Invalid if the field is missing from either schema, or if the source columns do not
///          contain it.
inline arrow::Status copy_column(
    std::shared_ptr<arrow::Schema> const & schema_a,
    std::vector<std::shared_ptr<arrow::Array>> & columns_a,
    char const * field_name,
    std::shared_ptr<arrow::Schema> const & schema_b,
    std::vector<std::shared_ptr<arrow::Array>> & columns_b)
{
    auto field_index_a = schema_a->GetFieldIndex(field_name);
    if (field_index_a == -1 || field_index_a >= (std::int64_t)columns_a.size()) {
        return arrow::Status::Invalid("Failed to find field '", field_name, "' during migration.");
    }

    auto source_column = columns_a[field_index_a];

    auto field_index_b = schema_b->GetFieldIndex(field_name);
    // A missing destination field is reported as -1; using that as an index would write outside
    // of the columns vector.
    if (field_index_b == -1) {
        return arrow::Status::Invalid(
            "Failed to find field '", field_name, "' in destination schema during migration.");
    }
    if (field_index_b >= (std::int64_t)columns_b.size()) {
        columns_b.resize(field_index_b + 1);
    }

    columns_b[field_index_b] = source_column;

    return arrow::Status::OK();
}

// Bundle describing an opened Arrow IPC table, as filled in by
// open_record_batch_reader().
struct Pod5BatchRecordReader {
    // Reader used to fetch record batches from the table.
    std::shared_ptr<arrow::ipc::RecordBatchFileReader> reader;
    // Schema reported by `reader`.
    std::shared_ptr<arrow::Schema> schema;
    // Key/value metadata attached to `schema`.
    std::shared_ptr<arrow::KeyValueMetadata const> metadata;
};

// Pairs an Arrow IPC writer with the schema its batches must follow.
struct Pod5BatchRecordWriter {
    // Destination writer for record batches.
    std::shared_ptr<arrow::ipc::RecordBatchWriter> writer;
    // Schema applied to every batch produced by write_batch().
    std::shared_ptr<arrow::Schema> schema;

    // Assemble `columns` into a record batch of `num_rows` rows and write it.
    //
    // `columns` is taken by value so that callers passing an rvalue hand the
    // vector over without a copy; the previous `const &` parameter made the
    // std::move below a silent copy. Lvalue callers keep working unchanged.
    //
    // Returns the status reported by the underlying writer.
    arrow::Status write_batch(
        std::size_t num_rows,
        std::vector<std::shared_ptr<arrow::Array>> columns)
    {
        auto const record_batch = arrow::RecordBatch::Make(schema, num_rows, std::move(columns));
        return writer->WriteRecordBatch(*record_batch);
    }
};

// Open the embedded table described by `file_info` for batch-wise reading.
//
// pool       Memory pool handed to the Arrow IPC reader.
// file_info  Location information for the sub file to open.
//
// Returns the reader together with its schema and schema metadata. Errors
// from opening the sub file or the reader are propagated, and an IOError is
// returned when the schema carries no metadata.
inline pod5::Result<Pod5BatchRecordReader> open_record_batch_reader(
    arrow::MemoryPool * pool,
    combined_file_utils::ParsedFileInfo file_info)
{
    ARROW_ASSIGN_OR_RAISE(auto sub_file, open_sub_file(file_info));

    arrow::ipc::IpcReadOptions options;
    options.memory_pool = pool;

    Pod5BatchRecordReader opened;
    ARROW_ASSIGN_OR_RAISE(
        opened.reader, arrow::ipc::RecordBatchFileReader::Open(sub_file, options));
    opened.schema = opened.reader->schema();
    opened.metadata = opened.schema->metadata();

    // Callers rely on the metadata being present, so refuse tables without it.
    if (opened.metadata == nullptr) {
        return Status::IOError("Missing metadata on read table schema");
    }

    return opened;
}

// Produce a copy of `original_metadata` whose "MINKNOW:pod5_version" entry
// is set to `version_to_write`.
//
// original_metadata  Metadata to copy; must not be null.
// version_to_write   Version recorded in the returned metadata.
//
// Returns the updated copy, Invalid when `original_metadata` is null, or the
// error reported while setting the key.
inline pod5::Result<std::shared_ptr<arrow::KeyValueMetadata const>> update_metadata(
    std::shared_ptr<arrow::KeyValueMetadata const> original_metadata,
    Version version_to_write)
{
    // A schema may carry no metadata at all; fail cleanly rather than
    // dereferencing a null pointer.
    if (!original_metadata) {
        return arrow::Status::Invalid("Missing metadata, cannot update pod5 version");
    }

    auto result = original_metadata->Copy();
    // Update the reader for the new version:
    ARROW_RETURN_NOT_OK(result->Set("MINKNOW:pod5_version", version_to_write.to_string()));
    return result;
}

// Create an Arrow IPC file writer at `path` for tables following `schema`.
//
// pool      Memory pool handed to the IPC writer.
// path      Path of the output file to open.
// schema    Schema of the batches that will be written.
// metadata  Key/value metadata passed to the file writer.
//
// Returns the writer paired with its schema, or the error raised while
// opening the file or creating the writer.
inline pod5::Result<Pod5BatchRecordWriter> make_record_batch_writer(
    arrow::MemoryPool * pool,
    std::string path,
    std::shared_ptr<arrow::Schema> schema,
    std::shared_ptr<arrow::KeyValueMetadata const> metadata)
{
    ARROW_ASSIGN_OR_RAISE(auto sink, arrow::io::FileOutputStream::Open(path, false));

    arrow::ipc::IpcWriteOptions options;
    options.memory_pool = pool;
    options.emit_dictionary_deltas = true;

    Pod5BatchRecordWriter created;
    ARROW_ASSIGN_OR_RAISE(
        created.writer, arrow::ipc::MakeFileWriter(sink, schema, options, metadata));
    created.schema = schema;
    return created;
}

// Sanity-check list and dictionary columns before they are migrated.
//
// schema   Schema supplying the field names used in error messages; it must
//          describe at least as many fields as there are columns.
// columns  Columns to inspect. Only list columns and dictionary columns are
//          examined; every other column type is accepted as is.
//
// Checks performed:
//  - list columns: offsets must never decrease;
//  - dictionary columns with string values: the offsets buffer must hold
//    exactly one more entry than there are dictionary values;
//  - dictionary columns: indices must be int16 and lie in
//    [0, dictionary length).
//
// Returns Invalid describing the first problem found, OK otherwise.
inline pod5::Status check_columns(
    std::shared_ptr<arrow::Schema> const & schema,
    std::vector<std::shared_ptr<arrow::Array>> const & columns)
{
    // schema->field() is indexed per column below; reject a mismatch up front.
    if (columns.size() > static_cast<std::size_t>(schema->num_fields())) {
        return arrow::Status::Invalid(
            "Found ",
            columns.size(),
            " columns but the schema only has ",
            schema->num_fields(),
            " fields");
    }

    for (std::size_t column_idx = 0; column_idx < columns.size(); ++column_idx) {
        auto const & column = columns[column_idx];
        auto const & schema_field = schema->field(static_cast<int>(column_idx));

        if (auto list = std::dynamic_pointer_cast<arrow::ListArray>(column)) {
            // Nothing to compare for an empty list column; skip reading its
            // offsets entirely.
            if (list->length() == 0) {
                continue;
            }

            auto last_value = list->value_offset(0);
            // 64-bit row index: array lengths are 64-bit.
            for (std::int64_t row = 1; row <= list->length(); ++row) {
                if (list->value_offset(row) < last_value) {
                    return arrow::Status::Invalid(
                        "Field content for field `",
                        schema_field->name(),
                        "`, list offsets are invalid"
                        " at row index ",
                        row,
                        " (",
                        list->value_offset(row),
                        " < ",
                        last_value,
                        ")");
                }
                last_value = list->value_offset(row);
            }
        } else if (auto dict = std::dynamic_pointer_cast<arrow::DictionaryArray>(column)) {
            auto dict_values = dict->dictionary();
            auto string_dictionary_values =
                std::dynamic_pointer_cast<arrow::StringArray>(dict_values);
            if (string_dictionary_values) {
                auto const value_offsets = string_dictionary_values->value_offsets();
                // A missing offsets buffer is treated as holding zero offsets.
                std::int64_t const value_offsets_length =
                    value_offsets
                        ? value_offsets->size() / sizeof(arrow::StringArray::offset_type)
                        : 0;
                if (value_offsets_length != (1 + dict_values->length()))
                {  // We expect N+1 offsets for the final element length
                    return arrow::Status::Invalid(
                        "Dictionary length for field `",
                        schema_field->name(),
                        "`, dictionary length is ",
                        dict_values->length(),
                        " but value offsets is length ",
                        value_offsets_length);
                }
            }

            auto indices = std::dynamic_pointer_cast<arrow::Int16Array>(dict->indices());
            if (!indices) {
                return arrow::Status::Invalid(
                    "Field content for field `",
                    schema_field->name(),
                    "`, dictionary indexes are missing");
            }
            for (std::int64_t row = 0; row < indices->length(); ++row) {
                auto const index_value = indices->Value(row);
                // Indices are signed, so a negative value is just as invalid
                // as one past the end of the dictionary.
                if (index_value < 0) {
                    return arrow::Status::Invalid(
                        "Field content for field `",
                        schema_field->name(),
                        "`, dictionary indexes are invalid"
                        " at row index ",
                        row,
                        " (",
                        index_value,
                        " < 0)");
                }
                if (index_value >= dict_values->length()) {
                    return arrow::Status::Invalid(
                        "Field content for field `",
                        schema_field->name(),
                        "`, dictionary indexes are invalid"
                        " at row index ",
                        row,
                        " (",
                        index_value,
                        " >= ",
                        dict_values->length(),
                        ")");
                }
            }
        }
    }

    return {};
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/migration/v0_to_v1.cpp
================================================
#include "pod5_format/migration/migration.h"
#include "pod5_format/migration/migration_utils.h"
#include "pod5_format/table_reader.h"

#include <arrow/array/builder_primitive.h>
#include <arrow/status.h>
#include <arrow/util/io_util.h>

#include <iostream>

namespace pod5 {

// Migrate a reads table from the v0 layout to the v1 layout.
//
// The v1 table is the v0 table plus seven extra columns, each filled with a
// constant default (0 for the counters and time_since_mux_change, NaN for
// the four scaling columns). The new table is written to a temporary
// directory and the returned MigrationResult's footer is pointed at it.
//
// v0_input  Migration state whose footer locates the v0 reads table; it is
//           moved into the returned result.
// pool      Memory pool used for reading, writing and the filled arrays.
//
// Returns the updated migration state, or the first error encountered.
arrow::Result<MigrationResult> migrate_v0_to_v1(
    MigrationResult && v0_input,
    arrow::MemoryPool * pool)
{
    ARROW_ASSIGN_OR_RAISE(auto temp_dir, MakeTmpDir("pod5_v0_v1_migration"));
    ARROW_ASSIGN_OR_RAISE(auto v1_reads_table_path, temp_dir->path().Join("reads_table.arrow"));

    {
        ARROW_ASSIGN_OR_RAISE(
            auto source, open_record_batch_reader(pool, v0_input.footer().reads_table));

        // Fields that exist in v1 but not in v0.
        auto const added_fields = arrow::schema(
            {arrow::field("num_minknow_events", arrow::uint64()),
             arrow::field("tracked_scaling_scale", arrow::float32()),
             arrow::field("tracked_scaling_shift", arrow::float32()),
             arrow::field("predicted_scaling_scale", arrow::float32()),
             arrow::field("predicted_scaling_shift", arrow::float32()),
             arrow::field("num_reads_since_mux_change", arrow::uint32()),
             arrow::field("time_since_mux_change", arrow::float32())});

        ARROW_ASSIGN_OR_RAISE(auto v1_schema, arrow::UnifySchemas({source.schema, added_fields}));

        ARROW_ASSIGN_OR_RAISE(
            auto v1_metadata, update_metadata(source.metadata, Version(0, 0, 24)));
        ARROW_ASSIGN_OR_RAISE(
            auto sink,
            make_record_batch_writer(
                pool, v1_reads_table_path.ToString(), v1_schema, v1_metadata));

        std::int64_t batch_idx = 0;
        while (batch_idx < source.reader->num_record_batches()) {
            // Load and validate the next v0 batch.
            ARROW_ASSIGN_OR_RAISE(
                auto v0_batch, ReadRecordBatchAndValidate(*source.reader, batch_idx));
            ARROW_RETURN_NOT_OK(v0_batch->ValidateFull());
            auto const num_rows = v0_batch->num_rows();

            if (num_rows < 0) {
                return arrow::Status::Invalid("Invalid number of rows");
            }
            if (POD5_ENABLE_FUZZERS && num_rows > 1'000'000) {
                return arrow::Status::Invalid("Skipping huge sizes when fuzzing");
            }

            // Start from the v0 columns and append the v1 defaults.
            std::vector<std::shared_ptr<arrow::Array>> columns = v0_batch->columns();
            ARROW_RETURN_NOT_OK(check_columns(source.schema, columns));

            // Adds one float column in which every row is NaN.
            auto const add_nan_column = [&](char const * name) {
                return set_column(
                    v1_schema,
                    columns,
                    name,
                    make_filled_array<arrow::FloatBuilder>(
                        pool, num_rows, std::numeric_limits<float>::quiet_NaN()));
            };

            ARROW_RETURN_NOT_OK(set_column(
                v1_schema,
                columns,
                "num_minknow_events",
                make_filled_array<arrow::UInt64Builder>(pool, num_rows, 0)));
            ARROW_RETURN_NOT_OK(add_nan_column("tracked_scaling_scale"));
            ARROW_RETURN_NOT_OK(add_nan_column("tracked_scaling_shift"));
            ARROW_RETURN_NOT_OK(add_nan_column("predicted_scaling_scale"));
            ARROW_RETURN_NOT_OK(add_nan_column("predicted_scaling_shift"));
            ARROW_RETURN_NOT_OK(set_column(
                v1_schema,
                columns,
                "num_reads_since_mux_change",
                make_filled_array<arrow::UInt32Builder>(pool, num_rows, 0)));
            ARROW_RETURN_NOT_OK(set_column(
                v1_schema,
                columns,
                "time_since_mux_change",
                make_filled_array<arrow::FloatBuilder>(pool, num_rows, 0.0f)));

            ARROW_RETURN_NOT_OK(sink.write_batch(num_rows, std::move(columns)));
            ++batch_idx;
        }

        ARROW_RETURN_NOT_OK(sink.writer->Close());
    }

    // Redirect the footer's reads table to the freshly written file, and keep
    // the temporary directory attached to the result.
    MigrationResult migrated = std::move(v0_input);
    ARROW_RETURN_NOT_OK(
        migrated.footer().reads_table.from_full_file(v1_reads_table_path.ToString()));
    migrated.add_temp_dir(std::move(temp_dir));

    return migrated;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/migration/v1_to_v2.cpp
================================================
#include "pod5_format/migration/migration.h"
#include "pod5_format/migration/migration_utils.h"
#include "pod5_format/table_reader.h"

#include <arrow/array/builder_primitive.h>
#include <arrow/ipc/reader.h>
#include <arrow/ipc/writer.h>
#include <arrow/util/io_util.h>

#include <iostream>

namespace pod5 {

// Total the sample counts of every signal-table row referenced by one read.
//
// signal_col      List column whose values are absolute signal-table row
//                 numbers; the values array must be uint64.
// row_idx         Row of `signal_col` to total.
// signal_batches  All signal-table batches. An absolute row is mapped to a
//                 batch by dividing by the first batch's row count.
//
// Returns the summed `samples` values, 0 when there are no signal batches,
// or Invalid when the column types are wrong or a referenced row cannot be
// located.
arrow::Result<std::size_t> get_num_samples(
    std::shared_ptr<arrow::ListArray> const & signal_col,
    std::size_t row_idx,
    std::vector<std::shared_ptr<arrow::RecordBatch>> const & signal_batches)
{
    if (signal_batches.empty()) {
        return 0;
    }

    std::size_t const signal_batch_size = signal_batches[0]->num_rows();
    std::size_t num_samples = 0;

    auto values = std::dynamic_pointer_cast<arrow::UInt64Array>(signal_col->values());
    if (!values) {
        return arrow::Status::Invalid("Invalid signal column, potentially corrupt file.");
    }

    auto const offset = signal_col->value_offset(row_idx);
    auto const signal_row_count = signal_col->value_length(row_idx);
    for (std::int64_t index = 0; index < signal_row_count; ++index) {
        auto const abs_index = offset + index;
        if (abs_index < 0 || abs_index >= values->length()) {
            return arrow::Status::Invalid("Invalid signal column, potentially corrupt file.");
        }

        auto const abs_row = values->Value(abs_index);

        // An empty first batch would make the division below divide by zero;
        // no signal row can be resolved in that case.
        if (signal_batch_size == 0) {
            return arrow::Status::Invalid(
                "Invalid signal row ", abs_row, ", first signal batch is empty");
        }

        auto const batch_idx = abs_row / signal_batch_size;
        auto const batch_row = abs_row - (batch_idx * signal_batch_size);

        if (batch_idx >= signal_batches.size()) {
            return arrow::Status::Invalid(
                "Invalid signal row ", abs_row, ", cannot find signal batch ", batch_idx);
        }

        auto const & batch = signal_batches[batch_idx];

        auto samples_column =
            std::dynamic_pointer_cast<arrow::UInt32Array>(batch->GetColumnByName("samples"));
        if (!samples_column) {
            return arrow::Status::Invalid("`samples` column is missing from file");
        }
        if (batch_row >= (std::size_t)samples_column->length()) {
            return arrow::Status::Invalid(
                "Invalid signal batch row ", batch_row, ", length is ", samples_column->length());
        }
        num_samples += samples_column->Value(batch_row);
    }

    return num_samples;
}

// Migrate a reads table from the v1 layout to the v2 layout.
//
// v2 adds a `num_samples` column, computed per read by summing the `samples`
// values of the signal-table rows the read's `signal` list refers to. The
// new reads table is written to a temporary directory and the returned
// MigrationResult's footer is pointed at it.
//
// v1_input  Migration state whose footer locates the v1 reads and signal
//           tables; it is moved into the returned result.
// pool      Memory pool used for reading, writing and building the new column.
//
// Returns the updated migration state, or the first error encountered.
arrow::Result<MigrationResult> migrate_v1_to_v2(
    MigrationResult && v1_input,
    arrow::MemoryPool * pool)
{
    ARROW_ASSIGN_OR_RAISE(auto temp_dir, MakeTmpDir("pod5_v1_v2_migration"));
    ARROW_ASSIGN_OR_RAISE(auto v2_reads_table_path, temp_dir->path().Join("reads_table.arrow"));

    {
        ARROW_ASSIGN_OR_RAISE(
            auto v1_reader, open_record_batch_reader(pool, v1_input.footer().reads_table));
        ARROW_ASSIGN_OR_RAISE(
            auto v1_signal_reader, open_record_batch_reader(pool, v1_input.footer().signal_table));

        // Load every signal batch up front; each read may reference rows in
        // any of them.
        std::vector<std::shared_ptr<arrow::RecordBatch>> signal_batches(
            v1_signal_reader.reader->num_record_batches());
        for (std::size_t batch_idx = 0;
             batch_idx < (std::size_t)v1_signal_reader.reader->num_record_batches();
             ++batch_idx)
        {
            ARROW_ASSIGN_OR_RAISE(
                signal_batches[batch_idx],
                ReadRecordBatchAndValidate(*v1_signal_reader.reader, batch_idx));
            ARROW_RETURN_NOT_OK(signal_batches[batch_idx]->ValidateFull());
        }

        // The only field v2 adds on top of v1.
        auto v2_new_schema = arrow::schema({arrow::field("num_samples", arrow::uint64())});
        ARROW_ASSIGN_OR_RAISE(
            auto new_metadata, update_metadata(v1_reader.metadata, Version(0, 0, 32)));
        ARROW_ASSIGN_OR_RAISE(
            auto v2_schema, arrow::UnifySchemas({v1_reader.schema, v2_new_schema}));
        ARROW_ASSIGN_OR_RAISE(
            auto v2_writer,
            make_record_batch_writer(
                pool, v2_reads_table_path.ToString(), v2_schema, new_metadata));

        for (std::int64_t batch_idx = 0; batch_idx < v1_reader.reader->num_record_batches();
             ++batch_idx)
        {
            // Read V1 data:
            ARROW_ASSIGN_OR_RAISE(
                auto v1_batch, ReadRecordBatchAndValidate(*v1_reader.reader, batch_idx));
            ARROW_RETURN_NOT_OK(v1_batch->ValidateFull());
            auto const num_rows = v1_batch->num_rows();

            // Extend with V2 data:
            std::vector<std::shared_ptr<arrow::Array>> columns = v1_batch->columns();

            auto signal_column =
                std::dynamic_pointer_cast<arrow::ListArray>(v1_batch->GetColumnByName("signal"));
            if (!signal_column) {
                return arrow::Status::Invalid("`signal` column is missing from file");
            }
            ARROW_RETURN_NOT_OK(signal_column->ValidateFull());

            // Allocate from the caller's pool, matching the reader and writer,
            // rather than from the process-wide default pool.
            arrow::UInt64Builder num_samples_builder(pool);
            for (std::int64_t row = 0; row < num_rows; ++row) {
                ARROW_ASSIGN_OR_RAISE(
                    auto num_samples, get_num_samples(signal_column, row, signal_batches));
                ARROW_RETURN_NOT_OK(num_samples_builder.Append(num_samples));
            }
            ARROW_RETURN_NOT_OK(
                set_column(v2_schema, columns, "num_samples", num_samples_builder.Finish()));
            ARROW_RETURN_NOT_OK(v2_writer.write_batch(num_rows, std::move(columns)));
        }

        ARROW_RETURN_NOT_OK(v2_writer.writer->Close());
    }

    // Set up migrated data to point at our new table:
    MigrationResult result = std::move(v1_input);
    ARROW_RETURN_NOT_OK(result.footer().reads_table.from_full_file(v2_reads_table_path.ToString()));
    result.add_temp_dir(std::move(temp_dir));

    return result;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/migration/v2_to_v3.cpp
================================================
#include "pod5_format/migration/migration.h"
#include "pod5_format/migration/migration_utils.h"
#include "pod5_format/types.h"

#include <arrow/array/builder_binary.h>
#include <arrow/array/builder_primitive.h>
#include <arrow/ipc/reader.h>
#include <arrow/ipc/writer.h>
#include <arrow/util/io_util.h>

#include <unordered_map>

namespace pod5 {

// One row's view into a dictionary-of-structs column, as produced by
// get_dict_struct().
struct StructRow {
    // Position within `data` that the row's dictionary index refers to.
    std::int64_t dict_item_index;
    // The dictionary's struct values.
    std::shared_ptr<arrow::StructArray> data;
};

// Incrementally builds a string dictionary column: `indices` holds one int16
// per row, `items` holds the distinct strings, and `lookup` maps each string
// to its position in `items`.
struct StringDictBuilder {
    arrow::Int16Builder indices;
    arrow::StringBuilder items;

    // Emit a dictionary array from the indices and strings gathered so far.
    //
    // Finishing `items` empties that builder, so the strings are appended
    // back afterwards, leaving them in the builder for later calls.
    //
    // Returns the dictionary array, or the first error reported by a builder.
    arrow::Result<std::shared_ptr<arrow::Array>> finish()
    {
        ARROW_ASSIGN_OR_RAISE(auto row_indices, indices.Finish());
        ARROW_ASSIGN_OR_RAISE(auto dictionary_values, items.Finish());

        auto const & strings = static_cast<arrow::StringArray const &>(*dictionary_values);

        // Put the finished strings back into the (now empty) builder.
        std::int64_t position = 0;
        while (position < strings.length()) {
            ARROW_RETURN_NOT_OK(items.Append(strings.GetView(position)));
            ++position;
        }

        return arrow::DictionaryArray::FromArrays(row_indices, dictionary_values);
    }

    std::unordered_map<std::string, std::int16_t> lookup;
};

// Look up the dictionary-of-structs column `field_name` in `batch` and
// return the dictionary entry selected by `row`.
//
// batch       Record batch containing the column.
// row         Row whose dictionary index is wanted.
// field_name  Name of the column to inspect.
//
// Returns the row's dictionary index together with the struct dictionary,
// or Invalid when the column is absent, is not a dictionary, or its
// dictionary values are not a struct array.
arrow::Result<StructRow> get_dict_struct(
    std::shared_ptr<arrow::RecordBatch> const & batch,
    std::size_t row,
    char const * field_name)
{
    auto const raw_column = batch->GetColumnByName(field_name);
    if (raw_column == nullptr) {
        return Status::Invalid("Failed to find column ", field_name);
    }

    auto const as_dictionary = std::dynamic_pointer_cast<arrow::DictionaryArray>(raw_column);
    if (as_dictionary == nullptr) {
        return Status::Invalid("Found column ", field_name, " is not a dictionary as expected");
    }

    auto struct_items = std::dynamic_pointer_cast<arrow::StructArray>(as_dictionary->dictionary());
    if (struct_items == nullptr) {
        return Status::Invalid("Dictionary column is not a struct as expected");
    }

    StructRow found;
    found.dict_item_index = as_dictionary->GetValueIndex(row);
    found.data = std::move(struct_items);
    return found;
}

// Append the value of struct field `field_name`, at the position selected
// by `struct_row`, to `builder`.
//
// ArrayType   Concrete Arrow array type the field is expected to have.
// struct_row  Dictionary entry to read from.
// field_name  Name of the struct field to read.
// builder     Builder receiving the value.
//
// Returns Invalid when the field is missing, has a different array type, or
// the dictionary index lies outside the field; otherwise the builder's
// Append status.
template <typename ArrayType, typename Builder>
arrow::Status
append_struct_row(StructRow const & struct_row, char const * field_name, Builder & builder)
{
    auto const untyped_field = struct_row.data->GetFieldByName(field_name);
    if (untyped_field == nullptr) {
        return Status::Invalid("Struct is missing ", field_name, " field");
    }

    auto const typed_field = std::dynamic_pointer_cast<ArrayType>(untyped_field);
    if (typed_field == nullptr) {
        return Status::Invalid(field_name, " field is the wrong type");
    }

    auto const item = struct_row.dict_item_index;
    bool const in_range = item >= 0 && item < untyped_field->length();
    if (!in_range) {
        return Status::Invalid("Dictionary index is out of range");
    }

    return builder.Append(typed_field->Value(item));
}

// Append the string held in struct field `field_name`, at the position
// selected by `struct_row`, to a string dictionary builder.
//
// A string already present in `builder.lookup` reuses its existing index;
// a new string is added to `builder.items` and registered in the lookup.
//
// struct_row  Dictionary entry to read from.
// field_name  Name of the (string) struct field to read.
// builder     Dictionary builder receiving the index and, if new, the string.
//
// Returns Invalid when the field is missing, is not a string array, the
// dictionary index lies outside the field, or the dictionary would need more
// entries than an int16 index can address; otherwise the builder's Append
// status.
arrow::Status append_struct_row_to_dict(
    StructRow const & struct_row,
    char const * field_name,
    StringDictBuilder & builder)
{
    auto field_array = struct_row.data->GetFieldByName(field_name);
    if (!field_array) {
        return Status::Invalid("Struct is missing ", field_name, " field");
    }

    auto typed_field_array = std::dynamic_pointer_cast<arrow::StringArray>(field_array);
    if (!typed_field_array) {
        return Status::Invalid(field_name, " field is the wrong type");
    }

    if (struct_row.dict_item_index < 0 || struct_row.dict_item_index >= field_array->length()) {
        return Status::Invalid("Dictionary index is out of range");
    }

    auto str_value = typed_field_array->GetString(struct_row.dict_item_index);
    auto it = builder.lookup.find(str_value);
    if (it != builder.lookup.end()) {
        return builder.indices.Append(it->second);
    }

    // Indices are stored as int16; refuse to wrap around silently once the
    // dictionary outgrows that range.
    auto const next_index = builder.items.length();
    if (next_index > INT16_MAX) {
        return Status::Invalid(
            "Too many distinct values for ", field_name, " to index with int16");
    }
    auto const index = static_cast<std::int16_t>(next_index);

    ARROW_RETURN_NOT_OK(builder.items.Append(str_value));
    builder.lookup[str_value] = index;
    return builder.indices.Append(index);
}

// Migrate a file from the v2 layout to the v3 layout.
//
// v3 flattens the dictionary-of-struct columns of the v2 reads table
// (`calibration`, `pore`, `end_reason`, `run_info`) into plain columns and
// string dictionaries, and moves the run-info struct fields into a separate
// run-info table. Both new tables are written to a temporary directory and
// the returned MigrationResult's footer is pointed at them.
//
// v2_input  Migration state whose footer locates the v2 reads table; it is
//           moved into the returned result.
// pool      Memory pool used for reading, writing and the per-batch builders.
//
// Returns the updated migration state, or the first error encountered.
arrow::Result<MigrationResult> migrate_v2_to_v3(
    MigrationResult && v2_input,
    arrow::MemoryPool * pool)
{
    ARROW_ASSIGN_OR_RAISE(auto temp_dir, MakeTmpDir("pod5_v2_v3_migration"));
    ARROW_ASSIGN_OR_RAISE(auto v3_reads_table_path, temp_dir->path().Join("reads_table.arrow"));
    ARROW_ASSIGN_OR_RAISE(
        auto v3_run_info_table_path, temp_dir->path().Join("run_info_table.arrow"));

    {
        ARROW_ASSIGN_OR_RAISE(
            auto v2_reader, open_record_batch_reader(pool, v2_input.footer().reads_table));
        ARROW_ASSIGN_OR_RAISE(
            auto new_metadata, update_metadata(v2_reader.metadata, Version(0, 0, 35)));

        auto const num_record_batches = v2_reader.reader->num_record_batches();

        {
            // Full v3 reads schema: the copied v2 columns followed by the
            // flattened replacements for the dictionary-of-struct columns.
            auto v3_reads_schema = arrow::schema(
                {arrow::field("read_id", uuid()),
                 arrow::field("signal", arrow::list(arrow::uint64())),
                 arrow::field("read_number", arrow::uint32()),
                 arrow::field("start", arrow::uint64()),
                 arrow::field("median_before", arrow::float32()),
                 arrow::field("num_minknow_events", arrow::uint64()),
                 arrow::field("tracked_scaling_scale", arrow::float32()),
                 arrow::field("tracked_scaling_shift", arrow::float32()),
                 arrow::field("predicted_scaling_scale", arrow::float32()),
                 arrow::field("predicted_scaling_shift", arrow::float32()),
                 arrow::field("num_reads_since_mux_change", arrow::uint32()),
                 arrow::field("time_since_mux_change", arrow::float32()),
                 arrow::field("num_samples", arrow::uint64()),
                 arrow::field("channel", arrow::uint16()),
                 arrow::field("well", arrow::uint8()),
                 arrow::field("pore_type", arrow::dictionary(arrow::int16(), arrow::utf8())),
                 arrow::field("calibration_offset", arrow::float32()),
                 arrow::field("calibration_scale", arrow::float32()),
                 arrow::field("end_reason", arrow::dictionary(arrow::int16(), arrow::utf8())),
                 arrow::field("end_reason_forced", arrow::boolean()),
                 arrow::field("run_info", arrow::dictionary(arrow::int16(), arrow::utf8()))},
                new_metadata);
            ARROW_ASSIGN_OR_RAISE(
                auto v3_reads_writer,
                make_record_batch_writer(
                    pool, v3_reads_table_path.ToString(), v3_reads_schema, new_metadata));

            // Columns carried over from v2 without modification.
            std::vector<std::string> const columns_to_copy{
                "read_id",
                "signal",
                "read_number",
                "start",
                "median_before",
                "num_minknow_events",
                "tracked_scaling_scale",
                "tracked_scaling_shift",
                "predicted_scaling_scale",
                "predicted_scaling_shift",
                "num_reads_since_mux_change",
                "time_since_mux_change",
                "num_samples"};

            // Builders for dict columns. These live outside the batch loop so
            // the dictionary contents accumulate across batches.
            StringDictBuilder pore_type;
            StringDictBuilder end_reason;
            StringDictBuilder run_info;
            for (std::int64_t batch_idx = 0; batch_idx < num_record_batches; ++batch_idx) {
                // Read V2 data:
                ARROW_ASSIGN_OR_RAISE(auto v2_batch, v2_reader.reader->ReadRecordBatch(batch_idx));
                ARROW_RETURN_NOT_OK(v2_batch->ValidateFull());
                auto const num_rows = v2_batch->num_rows();

                std::vector<std::shared_ptr<arrow::Array>> v3_columns;

                // Write V3 data:
                std::vector<std::shared_ptr<arrow::Array>> v2_columns = v2_batch->columns();
                for (auto const & col_name : columns_to_copy) {
                    ARROW_RETURN_NOT_OK(copy_column(
                        v2_reader.schema,
                        v2_columns,
                        col_name.data(),
                        v3_reads_schema,
                        v3_columns));
                }

                // Per-batch builders allocate from the caller's pool, matching
                // the reader and writer, instead of the default pool.
                arrow::UInt16Builder channel(pool);
                arrow::UInt8Builder well(pool);
                arrow::FloatBuilder calibration_offset(pool);
                arrow::FloatBuilder calibration_scale(pool);
                arrow::BooleanBuilder end_reason_forced(pool);
                for (std::int64_t row = 0; row < num_rows; ++row) {
                    ARROW_ASSIGN_OR_RAISE(
                        auto calibration_data, get_dict_struct(v2_batch, row, "calibration"));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row<arrow::FloatArray>(
                            calibration_data, "offset", calibration_offset));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row<arrow::FloatArray>(
                            calibration_data, "scale", calibration_scale));

                    ARROW_ASSIGN_OR_RAISE(auto pore_data, get_dict_struct(v2_batch, row, "pore"));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row<arrow::UInt16Array>(pore_data, "channel", channel));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row<arrow::UInt8Array>(pore_data, "well", well));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row_to_dict(pore_data, "pore_type", pore_type));

                    ARROW_ASSIGN_OR_RAISE(
                        auto end_reason_data, get_dict_struct(v2_batch, row, "end_reason"));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row_to_dict(end_reason_data, "name", end_reason));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row<arrow::BooleanArray>(
                            end_reason_data, "forced", end_reason_forced));

                    // In v3 the run info is referenced by its acquisition id.
                    ARROW_ASSIGN_OR_RAISE(
                        auto run_info_data, get_dict_struct(v2_batch, row, "run_info"));
                    ARROW_RETURN_NOT_OK(
                        append_struct_row_to_dict(run_info_data, "acquisition_id", run_info));
                }
                ARROW_RETURN_NOT_OK(set_column(
                    v3_reads_schema,
                    v3_columns,
                    "calibration_offset",
                    calibration_offset.Finish()));
                ARROW_RETURN_NOT_OK(set_column(
                    v3_reads_schema, v3_columns, "calibration_scale", calibration_scale.Finish()));
                ARROW_RETURN_NOT_OK(
                    set_column(v3_reads_schema, v3_columns, "channel", channel.Finish()));
                ARROW_RETURN_NOT_OK(set_column(v3_reads_schema, v3_columns, "well", well.Finish()));
                ARROW_RETURN_NOT_OK(
                    set_column(v3_reads_schema, v3_columns, "pore_type", pore_type.finish()));
                ARROW_RETURN_NOT_OK(
                    set_column(v3_reads_schema, v3_columns, "end_reason", end_reason.finish()));
                ARROW_RETURN_NOT_OK(set_column(
                    v3_reads_schema, v3_columns, "end_reason_forced", end_reason_forced.Finish()));
                ARROW_RETURN_NOT_OK(
                    set_column(v3_reads_schema, v3_columns, "run_info", run_info.finish()));

                ARROW_RETURN_NOT_OK(v3_reads_writer.write_batch(num_rows, std::move(v3_columns)));
            }
            ARROW_RETURN_NOT_OK(v3_reads_writer.writer->Close());
        }

        // NOTE(review): when the input has no record batches, no run-info file
        // is written here, yet the footer below is still pointed at that
        // path - confirm from_full_file() copes with a missing file.
        if (num_record_batches > 0) {
            // The run-info table is built from the dictionary attached to the
            // last batch's `run_info` column.
            ARROW_ASSIGN_OR_RAISE(
                auto v2_last_batch, v2_reader.reader->ReadRecordBatch(num_record_batches - 1));
            auto run_info_column = std::dynamic_pointer_cast<arrow::DictionaryArray>(
                v2_last_batch->GetColumnByName("run_info"));
            if (!run_info_column) {
                return arrow::Status::Invalid("Failed to find the run info column");
            }
            auto run_info_dict_type =
                std::dynamic_pointer_cast<arrow::DictionaryType>(run_info_column->type());
            if (!run_info_dict_type) {
                return arrow::Status::Invalid("Failed to find a run info of the right type");
            }
            auto run_info_items =
                std::dynamic_pointer_cast<arrow::StructArray>(run_info_column->dictionary());
            if (!run_info_items) {
                return arrow::Status::Invalid("Failed to find a run info items array");
            }
            auto run_info_items_type =
                std::dynamic_pointer_cast<arrow::StructType>(run_info_items->type());
            if (!run_info_items_type) {
                return arrow::Status::Invalid(
                    "Failed to find a run info items array of the right type");
            }

            // Append all the run info dict-struct data to the new table:
            auto v3_run_info_schema = arrow::schema(run_info_items_type->fields(), new_metadata);
            ARROW_ASSIGN_OR_RAISE(
                auto v3_run_info_writer,
                make_record_batch_writer(
                    pool, v3_run_info_table_path.ToString(), v3_run_info_schema, new_metadata));

            // Each struct field becomes one column of the run-info table.
            auto const & fields = run_info_items->fields();
            std::vector<std::shared_ptr<arrow::Array>> v3_columns(
                v3_run_info_schema->fields().size());
            for (std::size_t col = 0; col < v3_columns.size(); ++col) {
                v3_columns[col] = fields[col];
            }

            ARROW_RETURN_NOT_OK(
                v3_run_info_writer.write_batch(run_info_items->length(), std::move(v3_columns)));
            ARROW_RETURN_NOT_OK(v3_run_info_writer.writer->Close());
        }
    }

    // Set up migrated data to point at our new table:
    MigrationResult result = std::move(v2_input);
    ARROW_RETURN_NOT_OK(result.footer().reads_table.from_full_file(v3_reads_table_path.ToString()));
    ARROW_RETURN_NOT_OK(
        result.footer().run_info_table.from_full_file(v3_run_info_table_path.ToString()));
    result.add_temp_dir(std::move(temp_dir));

    return result;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/migration/v3_to_v4.cpp
================================================
#include "pod5_format/migration/migration.h"
#include "pod5_format/migration/migration_utils.h"
#include "pod5_format/table_reader.h"

#include <arrow/array/builder_primitive.h>
#include <arrow/status.h>
#include <arrow/util/io_util.h>

#include <unordered_map>

namespace pod5 {

/// \brief Migrate a v3 reads table to the v4 layout by appending an `open_pore_level` column.
///
/// The reads table referenced by \p v3_input is rewritten batch-by-batch into a new arrow
/// file inside a fresh temporary directory. Every row of the new float32 `open_pore_level`
/// column is filled with a quiet NaN. The returned result is \p v3_input with its reads
/// table location pointed at the rewritten file and the temporary directory attached to it.
///
/// \param v3_input The migration state holding the v3 reads table; consumed by this call.
/// \param pool     Memory pool passed to the reader, the writer and the array builder.
/// \returns The updated migration state, or the first error hit while reading/writing.
arrow::Result<MigrationResult> migrate_v3_to_v4(
    MigrationResult && v3_input,
    arrow::MemoryPool * pool)
{
    ARROW_ASSIGN_OR_RAISE(auto temp_dir, MakeTmpDir("pod5_v3_v4_migration"));
    ARROW_ASSIGN_OR_RAISE(auto v4_reads_table_path, temp_dir->path().Join("reads_table.arrow"));

    {
        ARROW_ASSIGN_OR_RAISE(
            auto v3_reader, open_record_batch_reader(pool, v3_input.footer().reads_table));

        // The V4 schema is the V3 schema plus the single new column:
        auto added_fields = arrow::schema({arrow::field("open_pore_level", arrow::float32())});
        ARROW_ASSIGN_OR_RAISE(
            auto v4_schema, arrow::UnifySchemas({v3_reader.schema, added_fields}));

        ARROW_ASSIGN_OR_RAISE(
            auto new_metadata, update_metadata(v3_reader.metadata, Version(0, 3, 30)));
        ARROW_ASSIGN_OR_RAISE(
            auto v4_writer,
            make_record_batch_writer(
                pool, v4_reads_table_path.ToString(), v4_schema, new_metadata));

        auto const batch_count = v3_reader.reader->num_record_batches();
        for (std::int64_t batch_idx = 0; batch_idx < batch_count; ++batch_idx) {
            // Read and validate the V3 batch:
            ARROW_ASSIGN_OR_RAISE(
                auto v3_batch, ReadRecordBatchAndValidate(*v3_reader.reader, batch_idx));
            ARROW_RETURN_NOT_OK(v3_batch->ValidateFull());

            auto const row_count = v3_batch->num_rows();
            if (row_count < 0) {
                return arrow::Status::Invalid("Invalid number of rows");
            }
            if (POD5_ENABLE_FUZZERS && row_count > 1'000'000) {
                return arrow::Status::Invalid("Skipping huge sizes when fuzzing");
            }

            // Start from the V3 columns and add the NaN-filled V4 column:
            std::vector<std::shared_ptr<arrow::Array>> columns = v3_batch->columns();
            ARROW_RETURN_NOT_OK(check_columns(v3_reader.schema, columns));
            ARROW_RETURN_NOT_OK(set_column(
                v4_schema,
                columns,
                "open_pore_level",
                make_filled_array<arrow::FloatBuilder>(
                    pool, row_count, std::numeric_limits<float>::quiet_NaN())));
            ARROW_RETURN_NOT_OK(v4_writer.write_batch(row_count, std::move(columns)));
        }

        ARROW_RETURN_NOT_OK(v4_writer.writer->Close());
    }

    // Point the migrated data at the freshly written table and keep the temp dir alive with it:
    MigrationResult result = std::move(v3_input);
    ARROW_RETURN_NOT_OK(result.footer().reads_table.from_full_file(v4_reads_table_path.ToString()));
    result.add_temp_dir(std::move(temp_dir));

    return result;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_reader.cpp
================================================
#include "pod5_format/read_table_reader.h"

#include "pod5_format/read_table_utils.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/schema_utils.h"

#include <arrow/array/array_binary.h>
#include <arrow/array/array_dict.h>
#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/ipc/reader.h>

#include <algorithm>

namespace pod5 {

/// \brief Wrap an arrow record batch together with the schema description used to find its
///        columns.
/// \param batch           The record batch; moved into the TableRecordBatch base.
/// \param field_locations Shared schema description; a reference to it is retained.
ReadTableRecordBatch::ReadTableRecordBatch(
    std::shared_ptr<arrow::RecordBatch> && batch,
    std::shared_ptr<ReadTableSchemaDescription const> const & field_locations)
: TableRecordBatch(std::move(batch))
, m_field_locations(field_locations)
{
}

/// \brief Move-construct from \p other.
///
/// Only the base class state and the field locations are taken from \p other; the dictionary
/// flags and the mutex are not mentioned in the initialiser list, so they start out
/// default-initialised in the new object.
ReadTableRecordBatch::ReadTableRecordBatch(ReadTableRecordBatch && other)
: TableRecordBatch(std::move(other))
, m_field_locations(std::move(other.m_field_locations))
{
}

/// \brief Look up the `read_id` column of this batch via the schema description.
std::shared_ptr<UuidArray> ReadTableRecordBatch::read_id_column() const
{
    auto const & read_id_field = m_field_locations->read_id;
    return find_column(batch(), read_id_field);
}

/// \brief Look up the `signal` list column of this batch via the schema description.
std::shared_ptr<arrow::ListArray> ReadTableRecordBatch::signal_column() const
{
    auto const & signal_field = m_field_locations->signal;
    return find_column(batch(), signal_field);
}

/// \brief Collect every column available in this batch into a single struct.
///
/// The V0 columns are always looked up. Columns introduced by later read table versions are
/// only looked up when the batch's table version is at least that version; otherwise the
/// matching members of the returned struct are left as default-constructed (null) pointers.
Result<ReadTableRecordColumns> ReadTableRecordBatch::columns() const
{
    auto const & fields = *m_field_locations;
    auto const & record_batch = batch();

    ReadTableRecordColumns cols;
    cols.table_version = fields.table_version();

    // V0 fields:
    cols.read_id = find_column(record_batch, fields.read_id);
    cols.signal = find_column(record_batch, fields.signal);
    cols.read_number = find_column(record_batch, fields.read_number);
    cols.start_sample = find_column(record_batch, fields.start);
    cols.median_before = find_column(record_batch, fields.median_before);

    // V1 fields:
    if (cols.table_version >= ReadTableSpecVersion::v1()) {
        cols.num_minknow_events = find_column(record_batch, fields.num_minknow_events);

        cols.tracked_scaling_scale = find_column(record_batch, fields.tracked_scaling_scale);
        cols.tracked_scaling_shift = find_column(record_batch, fields.tracked_scaling_shift);
        cols.predicted_scaling_scale = find_column(record_batch, fields.predicted_scaling_scale);
        cols.predicted_scaling_shift = find_column(record_batch, fields.predicted_scaling_shift);
        cols.num_reads_since_mux_change =
            find_column(record_batch, fields.num_reads_since_mux_change);
        cols.time_since_mux_change = find_column(record_batch, fields.time_since_mux_change);
    }

    // V2 fields:
    if (cols.table_version >= ReadTableSpecVersion::v2()) {
        cols.num_samples = find_column(record_batch, fields.num_samples);
    }

    // V3 fields:
    if (cols.table_version >= ReadTableSpecVersion::v3()) {
        cols.channel = find_column(record_batch, fields.channel);
        cols.well = find_column(record_batch, fields.well);
        cols.pore_type = find_column(record_batch, fields.pore_type);
        cols.calibration_offset = find_column(record_batch, fields.calibration_offset);
        cols.calibration_scale = find_column(record_batch, fields.calibration_scale);
        cols.end_reason = find_column(record_batch, fields.end_reason);
        cols.end_reason_forced = find_column(record_batch, fields.end_reason_forced);
        cols.run_info = find_column(record_batch, fields.run_info);
    }

    // V4 fields:
    if (cols.table_version >= ReadTableSpecVersion::v4()) {
        cols.open_pore_level = find_column(record_batch, fields.open_pore_level);
    }

    return cols;
}

/// \brief Get the signal table row indices that make up the signal of one read.
///
/// \param batch_row Row of the read within this batch.
/// \returns A slice of the signal list's values array covering the entries for \p batch_row,
///          or an Invalid status when \p batch_row is outside the batch or the list
///          offset/length stored for that row do not fit inside the values array.
Result<std::shared_ptr<arrow::UInt64Array>> ReadTableRecordBatch::get_signal_rows(
    std::int64_t batch_row) const
{
    auto signal_col = signal_column();

    // The list offsets are indexed by row, so a row outside the batch must be rejected
    // before value_offset/value_length are consulted.
    if (batch_row < 0 || batch_row >= signal_col->length()) {
        return arrow::Status::Invalid(
            "Invalid batch row '",
            batch_row,
            "' is outside the signal column of length '",
            signal_col->length(),
            "'.");
    }

    auto const & values = signal_col->values();

    auto const offset = signal_col->value_offset(batch_row);
    if (offset < 0 || offset >= values->length()) {
        return arrow::Status::Invalid(
            "Invalid signal row offset '", offset, "' is outside the size of the values array.");
    }

    auto const length = signal_col->value_length(batch_row);
    if (length < 0 || length > values->length() - offset) {
        return arrow::Status::Invalid(
            "Invalid signal row length '", length, "' is outside the size of the values array.");
    }

    return std::static_pointer_cast<arrow::UInt64Array>(values->Slice(offset, length));
}

/// \brief Fetch the dictionary (values) array backing the dictionary column \p array.
///
/// Each \p which slot has its own flag in m_dictionary_initialised. While the flag is unset,
/// the call to `array->dictionary()` is made under m_dictionary_access_lock and the flag is
/// set afterwards; once the flag is observed set, `array->dictionary()` is returned without
/// taking the lock.
///
/// NOTE(review): presumably this guards a lazily created dictionary inside
/// arrow::DictionaryArray against concurrent first access - confirm against the Arrow
/// version in use.
template <ReadTableRecordBatch::Dict which>
auto & ReadTableRecordBatch::get_dictionary(
    std::shared_ptr<arrow::DictionaryArray> const & array) const
{
    auto & initialised = m_dictionary_initialised[static_cast<std::size_t>(which)];
    // Fast path: a previous call already went through the locked path for this slot.
    if (initialised.load(std::memory_order_acquire)) {
        return array->dictionary();
    }

    // Slow path: serialise the first dictionary access, then publish the flag.
    std::lock_guard lock(m_dictionary_access_lock);
    auto & dict = array->dictionary();
    initialised.store(true, std::memory_order_release);
    return dict;
}

/// \brief Resolve a pore type dictionary index to its string value.
///
/// \param pore_index Index into the dictionary of the `pore_type` column.
/// \returns The dictionary string, Invalid when the file has no `pore_type` field, or
///          IndexError when \p pore_index is negative or past the end of the dictionary.
Result<std::string> ReadTableRecordBatch::get_pore_type(std::int16_t pore_index) const
{
    auto const & pore_field = m_field_locations->pore_type;
    if (!pore_field.found_field()) {
        return arrow::Status::Invalid("pore field is not present in the file");
    }

    auto column = find_column(batch(), pore_field);
    auto const & dictionary = get_dictionary<Dict::Pore>(column);
    auto const & names = static_cast<arrow::StringArray const &>(*dictionary);

    bool const in_range = pore_index >= 0 && pore_index < names.length();
    if (!in_range) {
        return arrow::Status::IndexError(
            "Invalid index ", pore_index, " for pore array of length ", names.length());
    }

    return names.GetString(pore_index);
}

/// \brief Resolve an end reason dictionary index to its enum value and string.
///
/// \param end_reason_index Index into the dictionary of the `end_reason` column.
/// \returns The parsed end reason paired with the dictionary string, Invalid when the file
///          has no `end_reason` field, or IndexError when \p end_reason_index is negative or
///          past the end of the dictionary.
Result<std::pair<ReadEndReason, std::string>> ReadTableRecordBatch::get_end_reason(
    std::int16_t end_reason_index) const
{
    if (!m_field_locations->end_reason.found_field()) {
        return arrow::Status::Invalid("end_reason field is not present in the file");
    }

    auto end_reason_column = find_column(batch(), m_field_locations->end_reason);
    auto const & end_reason_dict = get_dictionary<Dict::EndReason>(end_reason_column);
    auto const & end_reason_data = static_cast<arrow::StringArray const &>(*end_reason_dict);
    // The index is signed, so negative values must be rejected as well as too-large ones
    // (matching get_pore_type and get_run_info).
    if (end_reason_index < 0 || end_reason_index >= end_reason_data.length()) {
        return arrow::Status::IndexError(
            "Invalid index ",
            end_reason_index,
            " for end reason array of length ",
            end_reason_data.length());
    }

    auto str_value = end_reason_data.GetString(end_reason_index);
    auto reason = end_reason_from_string(str_value);

    return std::make_pair(reason, std::move(str_value));
}

/// \brief Resolve a run info dictionary index to its string value.
///
/// \param run_info_index Index into the dictionary of the `run_info` column.
/// \returns The dictionary string, Invalid when the file has no `run_info` field, or
///          IndexError when \p run_info_index is negative or past the end of the dictionary.
Result<std::string> ReadTableRecordBatch::get_run_info(std::int16_t run_info_index) const
{
    if (!m_field_locations->run_info.found_field()) {
        // Report the field that is actually missing (previously named end_reason here).
        return arrow::Status::Invalid("run_info field is not present in the file");
    }

    auto run_info_column = find_column(batch(), m_field_locations->run_info);
    auto const & run_info_dict = get_dictionary<Dict::RunInfo>(run_info_column);
    auto const & run_info_data = static_cast<arrow::StringArray const &>(*run_info_dict);
    if (run_info_index < 0 || run_info_index >= run_info_data.length()) {
        return arrow::Status::IndexError(
            "Invalid index ",
            run_info_index,
            " for run info array of length ",
            run_info_data.length());
    }

    return run_info_data.GetString(run_info_index);
}

//---------------------------------------------------------------------------------------------------------------------

/// \brief Construct a reads table reader.
/// \param input_source    Opaque handle forwarded to the TableReader base.
/// \param reader          The arrow IPC file reader, forwarded to the TableReader base.
/// \param field_locations Shared schema description; a reference to it is retained.
/// \param schema_metadata Schema metadata, forwarded to the TableReader base.
/// \param pool            Memory pool, forwarded to the TableReader base.
ReadTableReader::ReadTableReader(
    std::shared_ptr<void> && input_source,
    std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
    std::shared_ptr<ReadTableSchemaDescription const> const & field_locations,
    SchemaMetadataDescription && schema_metadata,
    arrow::MemoryPool * pool)
: TableReader(std::move(input_source), std::move(reader), std::move(schema_metadata), pool)
, m_field_locations(field_locations)
{
}

/// \brief Move-construct from \p other.
///
/// Takes over the base class state, the sorted read id index and the field locations of
/// \p other. The mutex members are not mentioned in the initialiser list, so they are
/// default-initialised; \p other's mutexes are not locked while its index is moved out.
ReadTableReader::ReadTableReader(ReadTableReader && other)
: TableReader(std::move(other))
, m_sorted_file_read_ids(std::move(other.m_sorted_file_read_ids))
, m_field_locations(std::move(other.m_field_locations))
{
}

/// \brief Move-assign from \p other.
///
/// Transfers the TableReader base state, the field locations and the sorted read id index
/// from \p other. The mutex members are left untouched. Self-assignment is a no-op.
ReadTableReader & ReadTableReader::operator=(ReadTableReader && other)
{
    if (this == &other) {
        return *this;
    }

    // Move the base sub-object from `other` (the previous code moved `*this` into itself,
    // so the base state of `other` was never transferred).
    static_cast<TableReader &>(*this) = std::move(static_cast<TableReader &>(other));
    m_field_locations = std::move(other.m_field_locations);
    m_sorted_file_read_ids = std::move(other.m_sorted_file_read_ids);
    return *this;
}

/// \brief Read record batch \p i of the reads table.
///
/// The underlying read is performed while holding m_batch_get_mutex.
/// \returns The batch wrapped with this reader's field locations, or the read error.
Result<ReadTableRecordBatch> ReadTableReader::read_record_batch(std::size_t i) const
{
    std::lock_guard<std::mutex> guard(m_batch_get_mutex);
    ARROW_ASSIGN_OR_RAISE(auto arrow_batch, TableReader::ReadRecordBatch(i));
    return ReadTableRecordBatch{std::move(arrow_batch), m_field_locations};
}

/// \brief Build the sorted read id index used by search_for_read_ids, if not already built.
///
/// Runs under m_sorted_file_read_ids_mutex. Every record batch is read and each read id is
/// recorded together with its batch index and row within that batch; the entries are then
/// sorted by read id. The member index is only replaced once all batches were read
/// successfully, so a failed read leaves it untouched.
Status ReadTableReader::build_read_id_lookup() const
{
    std::lock_guard lock(m_sorted_file_read_ids_mutex);

    // A non-empty index means an earlier call already did the work.
    bool const already_built = !m_sorted_file_read_ids.empty();
    if (already_built) {
        return Status::OK();
    }

    auto const total_batches = num_record_batches();
    std::vector<IndexData> index;
    std::size_t next_slot = 0;

    // Walk each batch and copy its read ids out into the index:
    for (std::size_t batch_index = 0; batch_index < total_batches; ++batch_index) {
        ARROW_ASSIGN_OR_RAISE(auto batch, read_record_batch(batch_index));

        // Size the allocation from the first batch, assuming later batches are similar.
        if (index.empty()) {
            index.reserve(batch.num_rows() * total_batches);
        }
        index.resize(index.size() + batch.num_rows());

        auto id_column = batch.read_id_column();
        auto ids = id_column->raw_values();
        auto const rows_in_batch = static_cast<std::size_t>(id_column->length());
        for (std::size_t row = 0; row < rows_in_batch; ++row) {
            // Record the id, and where it lives within the file:
            auto & entry = index[next_slot];
            entry.id = ids[row];
            entry.batch = batch_index;
            entry.batch_row = row;
            ++next_slot;
        }
    }

    // Order by read id so lookups can walk the index in step with sorted search input:
    std::sort(index.begin(), index.end(), [](auto const & lhs, auto const & rhs) {
        return lhs.id < rhs.id;
    });

    // Publish only now that the whole index was built successfully:
    m_sorted_file_read_ids = std::move(index);

    return Status::OK();
}

/// \brief Locate the requested read ids within the reads table.
///
/// \param search_input Sorted set of read ids to look for.
/// \param batch_counts Output: entry `i` receives the number of matches found in batch `i`.
///                     Must have at least one entry per batch that contains a match.
/// \param batch_rows   Output: the matching batch row indices, packed batch after batch and
///                     sorted ascending within each batch. Must be able to hold one entry
///                     per match.
/// \returns The number of read ids found, the error from building the read id index, or
///          Invalid when one of the output spans is too small for the results.
Result<std::size_t> ReadTableReader::search_for_read_ids(
    ReadIdSearchInput const & search_input,
    gsl::span<uint32_t> const & batch_counts,
    gsl::span<uint32_t> const & batch_rows) const
{
    ARROW_RETURN_NOT_OK(build_read_id_lookup());

    if (m_sorted_file_read_ids.empty()) {
        // Nothing can match, but still report a zero count for every batch so callers never
        // read counts that were not written.
        for (std::size_t i = 0; i < static_cast<std::size_t>(batch_counts.size()); ++i) {
            batch_counts[i] = 0;
        }
        return 0;
    }

    std::size_t successes = 0;

    std::vector<std::vector<std::uint32_t>> batch_data(batch_counts.size());
    // Guard the division: an empty batch_counts span would otherwise divide by zero.
    auto const initial_reserve_size =
        batch_data.empty() ? std::size_t{0} : search_input.read_id_count() / batch_data.size();
    for (auto & br : batch_data) {
        br.reserve(initial_reserve_size);
    }

    auto file_ids_current_it = m_sorted_file_read_ids.begin();
    auto const file_ids_end = m_sorted_file_read_ids.end();
    for (std::size_t i = 0; i < search_input.read_id_count(); ++i) {
        auto const & search_item = search_input[i];

        // Increment file pointer while less than the search term:
        while (file_ids_current_it != file_ids_end && file_ids_current_it->id < search_item.id) {
            ++file_ids_current_it;
        }

        // No more ids to search, both lists are sorted and we haven't found this one, we won't find any others.
        if (file_ids_current_it == file_ids_end) {
            break;
        }

        // If we found it record the location:
        if (file_ids_current_it->id == search_item.id) {
            // The caller-provided span decides how many batches we can report on.
            if (file_ids_current_it->batch >= batch_data.size()) {
                return Status::Invalid(
                    "batch_counts has ",
                    batch_data.size(),
                    " entries, which is too small to record a read in batch ",
                    file_ids_current_it->batch);
            }
            batch_data[file_ids_current_it->batch].push_back(file_ids_current_it->batch_row);
            successes += 1;
        }
    }

    // Every match is copied into batch_rows below, so it must be able to hold them all.
    if (successes > static_cast<std::size_t>(batch_rows.size())) {
        return Status::Invalid(
            "batch_rows has ",
            batch_rows.size(),
            " entries, which is too small to hold ",
            successes,
            " found reads");
    }

    std::size_t full_size_so_far = 0;
    for (std::size_t i = 0; i < batch_data.size(); ++i) {
        auto & data = batch_data[i];
        batch_counts[i] = data.size();

        // Ensure the batch indices within the batch are sorted:
        std::sort(data.begin(), data.end());

        // Copy the row indices into the packed vector:
        std::copy(data.begin(), data.end(), batch_rows.begin() + full_size_so_far);

        full_size_so_far += data.size();
    }

    return successes;
}

//---------------------------------------------------------------------------------------------------------------------

/// \brief Open a reads table stored as an arrow IPC file.
///
/// \param input The file to read the table from; also retained by the returned reader.
/// \param pool  Memory pool used by the arrow reader and passed on to the table reader.
/// \returns The table reader, IOError when the schema carries no key/value metadata, or
///          the error from opening the file / parsing the metadata / matching the schema.
Result<ReadTableReader> make_read_table_reader(
    std::shared_ptr<arrow::io::RandomAccessFile> const & input,
    arrow::MemoryPool * pool)
{
    arrow::ipc::IpcReadOptions read_options;
    read_options.memory_pool = pool;

    ARROW_ASSIGN_OR_RAISE(
        auto file_reader, arrow::ipc::RecordBatchFileReader::Open(input, read_options));

    // The pod5 schema metadata lives in the arrow schema's key/value metadata:
    auto key_values = file_reader->schema()->metadata();
    if (!key_values) {
        return Status::IOError("Missing metadata on read table schema");
    }

    ARROW_ASSIGN_OR_RAISE(auto read_metadata, read_schema_key_value_metadata(key_values));
    ARROW_ASSIGN_OR_RAISE(
        auto field_locations, read_read_table_schema(read_metadata, file_reader->schema()));

    return ReadTableReader(
        {input}, std::move(file_reader), field_locations, std::move(read_metadata), pool);
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_reader.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/read_table_schema.h"
#include "pod5_format/read_table_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/table_reader.h"
#include "pod5_format/types.h"
#include "pod5_format/uuid.h"

#include <arrow/io/type_fwd.h>
#include <gsl/gsl-lite.hpp>

#include <atomic>
#include <cstddef>
#include <cstdint>
#include <memory>
#include <mutex>
#include <string>
#include <utility>
#include <vector>

namespace arrow {
class Schema;

namespace io {
class RandomAccessFile;
}

namespace ipc {
class RecordBatchFileReader;
}
}  // namespace arrow

namespace pod5 {

class CalibrationData;
class EndReasonData;
class PoreData;
class RunInfoData;
class ReadIdSearchInput;

/// \brief The typed columns of one reads table record batch, plus the table version the
///        batch was written with.
///
/// Columns are grouped below by the read table version whose check guards them in
/// ReadTableRecordBatch::columns(); columns belonging to a version newer than
/// `table_version` are left as null pointers by that function.
struct ReadTableRecordColumns {
    // V0 columns
    std::shared_ptr<UuidArray> read_id;
    std::shared_ptr<arrow::ListArray> signal;
    std::shared_ptr<arrow::UInt32Array> read_number;
    std::shared_ptr<arrow::UInt64Array> start_sample;
    std::shared_ptr<arrow::FloatArray> median_before;

    // V1 columns
    std::shared_ptr<arrow::UInt64Array> num_minknow_events;

    [[deprecated]] std::shared_ptr<arrow::FloatArray> tracked_scaling_scale;
    [[deprecated]] std::shared_ptr<arrow::FloatArray> tracked_scaling_shift;
    [[deprecated]] std::shared_ptr<arrow::FloatArray> predicted_scaling_scale;
    [[deprecated]] std::shared_ptr<arrow::FloatArray> predicted_scaling_shift;
    [[deprecated]] std::shared_ptr<arrow::UInt32Array> num_reads_since_mux_change;
    [[deprecated]] std::shared_ptr<arrow::FloatArray> time_since_mux_change;

    // V2 columns
    std::shared_ptr<arrow::UInt64Array> num_samples;

    // V3 columns
    std::shared_ptr<arrow::UInt16Array> channel;
    std::shared_ptr<arrow::UInt8Array> well;
    std::shared_ptr<arrow::DictionaryArray> pore_type;
    std::shared_ptr<arrow::FloatArray> calibration_offset;
    std::shared_ptr<arrow::FloatArray> calibration_scale;
    std::shared_ptr<arrow::DictionaryArray> end_reason;
    std::shared_ptr<arrow::BooleanArray> end_reason_forced;
    std::shared_ptr<arrow::DictionaryArray> run_info;

    // V4 columns
    std::shared_ptr<arrow::FloatArray> open_pore_level;

    // Version of the read table these columns were taken from.
    TableSpecVersion table_version;
};

/// \brief A single record batch of the reads table, with typed access to its columns and to
///        the string values behind its dictionary columns.
class POD5_FORMAT_EXPORT ReadTableRecordBatch : public TableRecordBatch {
public:
    /// \brief Wrap \p batch, using \p field_locations to locate columns within it.
    ReadTableRecordBatch(
        std::shared_ptr<arrow::RecordBatch> && batch,
        std::shared_ptr<ReadTableSchemaDescription const> const & field_locations);

    ReadTableRecordBatch(ReadTableRecordBatch &&);

    /// \brief The `read_id` column of the batch.
    std::shared_ptr<UuidArray> read_id_column() const;
    /// \brief The `signal` list column of the batch.
    std::shared_ptr<arrow::ListArray> signal_column() const;

    /// \brief Look up the string for an index into the `pore_type` dictionary.
    Result<std::string> get_pore_type(std::int16_t pore_dict_index) const;
    /// \brief Look up the enum value and string for an index into the `end_reason` dictionary.
    Result<std::pair<ReadEndReason, std::string>> get_end_reason(
        std::int16_t end_reason_dict_index) const;
    /// \brief Look up the string for an index into the `run_info` dictionary.
    Result<std::string> get_run_info(std::int16_t run_info_dict_index) const;

    /// \brief Collect all columns available for the batch's table version.
    Result<ReadTableRecordColumns> columns() const;

    /// \brief Get the entries of the `signal` list for the read at \p batch_row.
    Result<std::shared_ptr<arrow::UInt64Array>> get_signal_rows(std::int64_t batch_row) const;

private:
    std::shared_ptr<ReadTableSchemaDescription const> m_field_locations;

    // One slot per dictionary column; `Max` is only used to size the flag array.
    enum class Dict : std::size_t { Pore, EndReason, RunInfo, Max };
    // Per-dictionary flag set by get_dictionary once its locked first access has completed.
    mutable std::atomic_bool m_dictionary_initialised[static_cast<std::size_t>(Dict::Max)]{};
    // Serialises the first dictionary access made through get_dictionary.
    mutable std::mutex m_dictionary_access_lock;
    template <Dict which>
    auto & get_dictionary(std::shared_ptr<arrow::DictionaryArray> const & array) const;
};

/// \brief Reader for the reads table: yields typed record batches and supports searching
///        the table for a set of read ids.
class POD5_FORMAT_EXPORT ReadTableReader : public TableReader {
public:
    /// \brief Construct from an opened arrow IPC reader and the parsed schema information.
    ReadTableReader(
        std::shared_ptr<void> && input_source,
        std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
        std::shared_ptr<ReadTableSchemaDescription const> const & field_locations,
        SchemaMetadataDescription && schema_metadata,
        arrow::MemoryPool * pool);

    ReadTableReader(ReadTableReader && other);
    ReadTableReader & operator=(ReadTableReader && other);

    /// \brief Read record batch \p i from the table.
    Result<ReadTableRecordBatch> read_record_batch(std::size_t i) const;

    /// \brief Find the batch/row location of each read id in \p search_input.
    /// \param search_input Read ids to find.
    /// \param batch_counts Output: number of reads found in each batch.
    /// \param batch_rows   Output: batch row indices of the found reads, packed per batch.
    /// \returns The number of read ids that were found.
    Result<std::size_t> search_for_read_ids(
        ReadIdSearchInput const & search_input,
        gsl::span<uint32_t> const & batch_counts,
        gsl::span<uint32_t> const & batch_rows) const;

private:
    // Location of one read id within the table.
    struct IndexData {
        Uuid id;
        std::size_t batch;
        std::size_t batch_row;
    };

    // Builds m_sorted_file_read_ids on first use (guarded by m_sorted_file_read_ids_mutex).
    Status build_read_id_lookup() const;
    // Every read id in the table, sorted by id.
    mutable std::vector<IndexData> m_sorted_file_read_ids;
    mutable std::mutex m_sorted_file_read_ids_mutex;

private:
    std::shared_ptr<ReadTableSchemaDescription const> m_field_locations;

    // Held by read_record_batch while a batch is read from the underlying reader.
    mutable std::mutex m_batch_get_mutex;
};

/// \brief Open a reads table from an arrow IPC file.
/// \param sink The file to read from (despite its name, this parameter is the input source).
/// \param pool Memory pool to use for reading.
POD5_FORMAT_EXPORT Result<ReadTableReader> make_read_table_reader(
    std::shared_ptr<arrow::io::RandomAccessFile> const & sink,
    arrow::MemoryPool * pool);

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_schema.cpp
================================================
#include "pod5_format/read_table_schema.h"

#include "pod5_format/schema_metadata.h"
#include "pod5_format/types.h"

namespace pod5 {

/// \brief Describe the latest reads table schema: each field is registered with its column
///        name, its arrow type and the read table version passed as its last argument.
ReadTableSchemaDescription::ReadTableSchemaDescription()
: SchemaDescriptionBase(ReadTableSpecVersion::latest())
// V0 Fields
, read_id(this, "read_id", uuid(), ReadTableSpecVersion::v0())
, signal(this, "signal", arrow::list(arrow::uint64()), ReadTableSpecVersion::v0())
, read_number(this, "read_number", arrow::uint32(), ReadTableSpecVersion::v0())
, start(this, "start", arrow::uint64(), ReadTableSpecVersion::v0())
, median_before(this, "median_before", arrow::float32(), ReadTableSpecVersion::v0())
,
// V1 Fields
num_minknow_events(this, "num_minknow_events", arrow::uint64(), ReadTableSpecVersion::v1())
, tracked_scaling_scale(this, "tracked_scaling_scale", arrow::float32(), ReadTableSpecVersion::v1())
, tracked_scaling_shift(this, "tracked_scaling_shift", arrow::float32(), ReadTableSpecVersion::v1())
, predicted_scaling_scale(
      this,
      "predicted_scaling_scale",
      arrow::float32(),
      ReadTableSpecVersion::v1())
, predicted_scaling_shift(
      this,
      "predicted_scaling_shift",
      arrow::float32(),
      ReadTableSpecVersion::v1())
, num_reads_since_mux_change(
      this,
      "num_reads_since_mux_change",
      arrow::uint32(),
      ReadTableSpecVersion::v1())
, time_since_mux_change(this, "time_since_mux_change", arrow::float32(), ReadTableSpecVersion::v1())
,
// V2 Fields
num_samples(this, "num_samples", arrow::uint64(), ReadTableSpecVersion::v2())
,
// V3 Fields
channel(this, "channel", arrow::uint16(), ReadTableSpecVersion::v3())
, well(this, "well", arrow::uint8(), ReadTableSpecVersion::v3())
, pore_type(
      this,
      "pore_type",
      arrow::dictionary(arrow::int16(), arrow::utf8()),
      ReadTableSpecVersion::v3())
, calibration_offset(this, "calibration_offset", arrow::float32(), ReadTableSpecVersion::v3())
, calibration_scale(this, "calibration_scale", arrow::float32(), ReadTableSpecVersion::v3())
, end_reason(
      this,
      "end_reason",
      arrow::dictionary(arrow::int16(), arrow::utf8()),
      ReadTableSpecVersion::v3())
, end_reason_forced(this, "end_reason_forced", arrow::boolean(), ReadTableSpecVersion::v3())
, run_info(
      this,
      "run_info",
      arrow::dictionary(arrow::int16(), arrow::utf8()),
      ReadTableSpecVersion::v3())
// V4 Fields
, open_pore_level(this, "open_pore_level", arrow::float32(), ReadTableSpecVersion::v4())
{
}

/// \brief Map a file version to the read table version to use.
///
/// The \p file_version argument is currently ignored: the latest read table version is
/// returned for every input.
TableSpecVersion ReadTableSchemaDescription::table_version_from_file_version(
    Version file_version) const
{
    return ReadTableSpecVersion::latest();
}

/// \brief Build a reads table schema description from an arrow schema and its metadata.
///
/// \param schema_metadata Parsed pod5 metadata of the table.
/// \param schema          The arrow schema of the table.
/// \returns The populated description, or the error reported by read_schema.
Result<std::shared_ptr<ReadTableSchemaDescription const>> read_read_table_schema(
    SchemaMetadataDescription const & schema_metadata,
    std::shared_ptr<arrow::Schema> const & schema)
{
    auto description = std::make_shared<ReadTableSchemaDescription>();

    // Fill in the freshly created description from the supplied schema:
    ARROW_RETURN_NOT_OK(
        ReadTableSchemaDescription::read_schema(description, schema_metadata, schema));

    return description;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_schema.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/schema_utils.h"
#include "pod5_format/tuple_utils.h"
#include "pod5_format/types.h"

#include <memory>
#include <tuple>
#include <vector>

namespace arrow {
class KeyValueMetadata;
class Schema;
class DataType;
class StructType;
}  // namespace arrow

namespace pod5 {

struct SchemaMetadataDescription;

/// \brief Named versions of the reads table specification.
class ReadTableSpecVersion {
public:
    // Initial version of the reads table.
    static TableSpecVersion v0() { return TableSpecVersion::first_version(); }

    static TableSpecVersion v1()
    {
        // Addition of num_minknow_events and scaling parameters
        return TableSpecVersion::at_version(1);
    }

    static TableSpecVersion v2()
    {
        // Addition of num_samples parameters
        return TableSpecVersion::at_version(2);
    }

    static TableSpecVersion v3()
    {
        // Flattening of dictionaries into separate table.
        return TableSpecVersion::at_version(3);
    }

    static TableSpecVersion v4()
    {
        // Addition of the open_pore_level field.
        return TableSpecVersion::at_version(4);
    }

    // The version used when describing the current schema.
    static TableSpecVersion latest() { return v4(); }
};

/// \brief Description of the reads table schema: one typed field member per column, grouped
///        by the read table version each field is registered with in the constructor.
class ReadTableSchemaDescription : public SchemaDescriptionBase {
public:
    ReadTableSchemaDescription();

    // Not copyable.
    ReadTableSchemaDescription(ReadTableSchemaDescription const &) = delete;
    ReadTableSchemaDescription & operator=(ReadTableSchemaDescription const &) = delete;

    /// \brief Table version to use for a given file version.
    TableSpecVersion table_version_from_file_version(Version file_version) const override;

    // NOTE(review): the integer template argument looks like the field's position in the
    // latest schema - confirm against the Field definition in schema_utils.h.

    // V0 fields
    Field<0, UuidArray> read_id;
    ListField<1, arrow::ListArray, arrow::UInt64Array> signal;
    Field<2, arrow::UInt32Array> read_number;
    Field<3, arrow::UInt64Array> start;
    Field<4, arrow::FloatArray> median_before;

    // V1 fields
    Field<5, arrow::UInt64Array> num_minknow_events;
    [[deprecated]] Field<6, arrow::FloatArray> tracked_scaling_scale;
    [[deprecated]] Field<7, arrow::FloatArray> tracked_scaling_shift;
    [[deprecated]] Field<8, arrow::FloatArray> predicted_scaling_scale;
    [[deprecated]] Field<9, arrow::FloatArray> predicted_scaling_shift;
    [[deprecated]] Field<10, arrow::UInt32Array> num_reads_since_mux_change;
    [[deprecated]] Field<11, arrow::FloatArray> time_since_mux_change;

    // V2 fields
    Field<12, arrow::UInt64Array> num_samples;

    // V3 fields
    Field<13, arrow::UInt16Array> channel;
    Field<14, arrow::UInt8Array> well;
    Field<15, arrow::DictionaryArray> pore_type;
    Field<16, arrow::FloatArray> calibration_offset;
    Field<17, arrow::FloatArray> calibration_scale;
    Field<18, arrow::DictionaryArray> end_reason;
    Field<19, arrow::BooleanArray> end_reason_forced;
    Field<20, arrow::DictionaryArray> run_info;

    // V4 fields
    Field<21, arrow::FloatArray> open_pore_level;

    // Field Builders only for fields we write in newly generated files.
    // Should not include fields which are removed in the latest version:
    // (The deprecated V1 scaling/mux fields are still listed here.)
    using FieldBuilders = FieldBuilder<
        // V0 fields
        decltype(read_id),
        decltype(signal),
        decltype(read_number),
        decltype(start),
        decltype(median_before),

        // V1 fields
        decltype(num_minknow_events),
        decltype(tracked_scaling_scale),
        decltype(tracked_scaling_shift),
        decltype(predicted_scaling_scale),
        decltype(predicted_scaling_shift),
        decltype(num_reads_since_mux_change),
        decltype(time_since_mux_change),

        // V2 fields
        decltype(num_samples),

        // V3 fields
        decltype(channel),
        decltype(well),
        decltype(pore_type),
        decltype(calibration_offset),
        decltype(calibration_scale),
        decltype(end_reason),
        decltype(end_reason_forced),
        decltype(run_info),

        // V4 fields
        decltype(open_pore_level)>;
};

/// \brief Build a reads table schema description from a table's metadata and arrow schema.
/// \param schema_metadata Parsed pod5 metadata of the table.
/// \returns The description, or an error if the schema could not be read.
POD5_FORMAT_EXPORT Result<std::shared_ptr<ReadTableSchemaDescription const>> read_read_table_schema(
    SchemaMetadataDescription const & schema_metadata,
    std::shared_ptr<arrow::Schema> const &);

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_utils.cpp
================================================
#include "pod5_format/read_table_utils.h"

#include <algorithm>

namespace pod5 {

/// \brief Prepare a set of read ids for searching.
///
/// Each id is stored together with its position in \p input_ids, and the stored entries are
/// then sorted by id.
ReadIdSearchInput::ReadIdSearchInput(gsl::span<Uuid const> const & input_ids)
: m_search_read_ids(input_ids.size())
{
    // Remember where each id came from before the order is changed:
    for (std::size_t position = 0; position < input_ids.size(); ++position) {
        auto & entry = m_search_read_ids[position];
        entry.id = input_ids[position];
        entry.index = position;
    }

    // Order the entries by read id:
    auto const by_id = [](auto const & lhs, auto const & rhs) { return lhs.id < rhs.id; };
    std::sort(m_search_read_ids.begin(), m_search_read_ids.end(), by_id);
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_utils.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/uuid.h"

#include <gsl/gsl-lite.hpp>

#include <chrono>
#include <cstdint>
#include <string>
#include <vector>

namespace pod5 {

using PoreDictionaryIndex = std::int16_t;
using EndReasonDictionaryIndex = std::int16_t;
using RunInfoDictionaryIndex = std::int16_t;

/// \brief Plain value type holding the per-read fields of one reads table row.
class ReadData {
public:
    // NOTE: the members have no default initialisers, so a default-constructed ReadData
    // holds indeterminate values until they are assigned.
    ReadData() = default;

    /// \brief Create a new read data structure to add to a read.
    /// \param read_id The read id for the read entry.
    /// \param read_number Read number for this read.
    /// \param start_sample The sample which this read starts at.
    /// \param channel The channel value for this read.
    /// \param well The well value for this read.
    /// \param pore_type The dictionary index of the pore type for this read.
    /// \param calibration_offset The calibration offset for this read.
    /// \param calibration_scale The calibration scale for this read.
    /// \param median_before The median of the read chunk prior to the start of this read.
    /// \param end_reason The dictionary index of the end reason name which caused this read to complete.
    /// \param end_reason_forced Boolean value indicating if the read end was forced.
    /// \param run_info The dictionary index of the run info for this read.
    /// \param num_minknow_events The number of minknow events in the read.
    /// \param tracked_scaling_scale Stored in the deprecated field of the same name.
    /// \param tracked_scaling_shift Stored in the deprecated field of the same name.
    /// \param predicted_scaling_scale Stored in the deprecated field of the same name.
    /// \param predicted_scaling_shift Stored in the deprecated field of the same name.
    /// \param num_reads_since_mux_change Stored in the deprecated field of the same name.
    /// \param time_since_mux_change Stored in the deprecated field of the same name.
    /// \param open_pore_level The open pore level value for this read.
    ReadData(
        Uuid const & read_id,
        std::uint32_t read_number,
        std::uint64_t start_sample,
        std::uint16_t channel,
        std::uint8_t well,
        PoreDictionaryIndex pore_type,
        float calibration_offset,
        float calibration_scale,
        float median_before,
        EndReasonDictionaryIndex end_reason,
        bool end_reason_forced,
        RunInfoDictionaryIndex run_info,
        std::uint64_t num_minknow_events,
        float tracked_scaling_scale,
        float tracked_scaling_shift,
        float predicted_scaling_scale,
        float predicted_scaling_shift,
        std::uint32_t num_reads_since_mux_change,
        float time_since_mux_change,
        float open_pore_level)
    // The initialisers follow the member declaration order below, not the parameter order.
    : read_id(read_id)
    , read_number(read_number)
    , start_sample(start_sample)
    , median_before(median_before)
    , end_reason(end_reason)
    , end_reason_forced(end_reason_forced)
    , run_info(run_info)
    , num_minknow_events(num_minknow_events)
    , tracked_scaling_scale(tracked_scaling_scale)
    , tracked_scaling_shift(tracked_scaling_shift)
    , predicted_scaling_scale(predicted_scaling_scale)
    , predicted_scaling_shift(predicted_scaling_shift)
    , num_reads_since_mux_change(num_reads_since_mux_change)
    , time_since_mux_change(time_since_mux_change)
    , channel(channel)
    , well(well)
    , pore_type(pore_type)
    , calibration_offset(calibration_offset)
    , calibration_scale(calibration_scale)
    , open_pore_level(open_pore_level)
    {
    }

    // NOTE(review): the group labels below are one higher than the versions used for the
    // matching columns in ReadTableSchemaDescription (v0/v1 there) - confirm which is intended.

    // V1 Fields
    Uuid read_id;
    std::uint32_t read_number;
    std::uint64_t start_sample;
    float median_before;
    EndReasonDictionaryIndex end_reason;
    bool end_reason_forced;
    RunInfoDictionaryIndex run_info;

    // V2 Fields
    std::uint64_t num_minknow_events;
    [[deprecated]] float tracked_scaling_scale;
    [[deprecated]] float tracked_scaling_shift;
    [[deprecated]] float predicted_scaling_scale;
    [[deprecated]] float predicted_scaling_shift;
    [[deprecated]] std::uint32_t num_reads_since_mux_change;
    [[deprecated]] float time_since_mux_change;

    // V3 Fields
    std::uint16_t channel;
    std::uint8_t well;
    PoreDictionaryIndex pore_type;
    float calibration_offset;
    float calibration_scale;

    // V4 Fields
    float open_pore_level;
};

/// \brief Member-wise equality of two ReadData values.
///
/// Every field is compared with `==`, so a float field holding NaN in either operand makes
/// the two values compare unequal.
inline bool operator==(ReadData const & a, ReadData const & b)
{
    // Identity and position of the read:
    bool const same_identity = a.read_id == b.read_id && a.read_number == b.read_number
                               && a.start_sample == b.start_sample
                               && a.median_before == b.median_before;
    if (!same_identity) {
        return false;
    }

    // End reason, run info and event count:
    bool const same_end_and_run = a.end_reason == b.end_reason
                                  && a.end_reason_forced == b.end_reason_forced
                                  && a.run_info == b.run_info
                                  && a.num_minknow_events == b.num_minknow_events;
    if (!same_end_and_run) {
        return false;
    }

    // Scaling and mux change values:
    bool const same_scaling = a.tracked_scaling_scale == b.tracked_scaling_scale
                              && a.tracked_scaling_shift == b.tracked_scaling_shift
                              && a.predicted_scaling_scale == b.predicted_scaling_scale
                              && a.predicted_scaling_shift == b.predicted_scaling_shift
                              && a.num_reads_since_mux_change == b.num_reads_since_mux_change
                              && a.time_since_mux_change == b.time_since_mux_change;
    if (!same_scaling) {
        return false;
    }

    // Channel, pore, calibration and open pore level:
    return a.channel == b.channel && a.well == b.well && a.pore_type == b.pore_type
           && a.calibration_offset == b.calibration_offset
           && a.calibration_scale == b.calibration_scale
           && a.open_pore_level == b.open_pore_level;
}

/// \brief Plain value type holding the description of one acquisition run.
///
/// All members are public and are filled in directly from the constructor
/// arguments of the same name. The two timestamp members are stored as
/// millisecond counts; see convert_from_system_clock / convert_to_system_clock.
class RunInfoData {
public:
    /// Ordered list of key/value string pairs (used for context tags and tracking ids).
    using MapType = std::vector<std::pair<std::string, std::string>>;

    /// \brief Build a run info record from its individual fields.
    ///
    /// String and map arguments are taken by value and moved into the members;
    /// arithmetic arguments are simply copied.
    RunInfoData(
        std::string acquisition_id,
        std::int64_t acquisition_start_time,
        std::int16_t adc_max,
        std::int16_t adc_min,
        MapType context_tags,
        std::string experiment_name,
        std::string flow_cell_id,
        std::string flow_cell_product_code,
        std::string protocol_name,
        std::string protocol_run_id,
        std::int64_t protocol_start_time,
        std::string sample_id,
        std::uint16_t sample_rate,
        std::string sequencing_kit,
        std::string sequencer_position,
        std::string sequencer_position_type,
        std::string software,
        std::string system_name,
        std::string system_type,
        MapType tracking_id)
    : acquisition_id(std::move(acquisition_id))
    , acquisition_start_time(acquisition_start_time)
    , adc_max(adc_max)
    , adc_min(adc_min)
    , context_tags(std::move(context_tags))
    , experiment_name(std::move(experiment_name))
    , flow_cell_id(std::move(flow_cell_id))
    , flow_cell_product_code(std::move(flow_cell_product_code))
    , protocol_name(std::move(protocol_name))
    , protocol_run_id(std::move(protocol_run_id))
    , protocol_start_time(protocol_start_time)
    , sample_id(std::move(sample_id))
    , sample_rate(sample_rate)
    , sequencing_kit(std::move(sequencing_kit))
    , sequencer_position(std::move(sequencer_position))
    , sequencer_position_type(std::move(sequencer_position_type))
    , software(std::move(software))
    , system_name(std::move(system_name))
    , system_type(std::move(system_type))
    , tracking_id(std::move(tracking_id))
    {
    }

    /// \brief Convert a system clock time point to whole milliseconds since the clock's epoch.
    /// \param value The time point to convert.
    /// \returns The millisecond count, truncated toward zero.
    static std::int64_t convert_from_system_clock(std::chrono::system_clock::time_point value)
    {
        auto const since_epoch = value.time_since_epoch();
        return std::chrono::duration_cast<std::chrono::milliseconds>(since_epoch).count();
    }

    /// \brief Convert a millisecond count since the system clock's epoch back to a time point.
    /// \param since_epoch_ms Milliseconds since the epoch of std::chrono::system_clock.
    /// \returns The corresponding system clock time point.
    static std::chrono::system_clock::time_point convert_to_system_clock(
        std::int64_t since_epoch_ms)
    {
        std::chrono::milliseconds const offset(since_epoch_ms);
        return std::chrono::system_clock::time_point() + offset;
    }

    std::string acquisition_id;
    std::int64_t acquisition_start_time;
    std::int16_t adc_max;
    std::int16_t adc_min;
    MapType context_tags;
    std::string experiment_name;
    std::string flow_cell_id;
    std::string flow_cell_product_code;
    std::string protocol_name;
    std::string protocol_run_id;
    std::int64_t protocol_start_time;
    std::string sample_id;
    std::uint16_t sample_rate;
    std::string sequencing_kit;
    std::string sequencer_position;
    std::string sequencer_position_type;
    std::string software;
    std::string system_name;
    std::string system_type;
    MapType tracking_id;
};

/// \brief Compare two RunInfoData records member by member.
///
/// Two records are equal only when every member, including both key/value
/// maps (compared element-wise and in order), is equal.
inline bool operator==(RunInfoData const & a, RunInfoData const & b)
{
    // Acquisition and ADC range.
    bool const acquisition_matches = a.acquisition_id == b.acquisition_id
                                     && a.acquisition_start_time == b.acquisition_start_time
                                     && a.adc_max == b.adc_max && a.adc_min == b.adc_min;
    if (!acquisition_matches) {
        return false;
    }

    // Experiment, flow cell and protocol.
    bool const experiment_matches = a.context_tags == b.context_tags
                                    && a.experiment_name == b.experiment_name
                                    && a.flow_cell_id == b.flow_cell_id
                                    && a.flow_cell_product_code == b.flow_cell_product_code
                                    && a.protocol_name == b.protocol_name
                                    && a.protocol_run_id == b.protocol_run_id
                                    && a.protocol_start_time == b.protocol_start_time;
    if (!experiment_matches) {
        return false;
    }

    // Sample and sequencing hardware.
    bool const sample_matches = a.sample_id == b.sample_id && a.sample_rate == b.sample_rate
                                && a.sequencing_kit == b.sequencing_kit
                                && a.sequencer_position == b.sequencer_position
                                && a.sequencer_position_type == b.sequencer_position_type;
    if (!sample_matches) {
        return false;
    }

    // Software, host system and tracking id.
    return a.software == b.software && a.system_name == b.system_name
           && a.system_type == b.system_type && a.tracking_id == b.tracking_id;
}

/// \brief Reason a read ended.
///
/// Enumerators are numbered consecutively from zero in declaration order.
/// EndReasonWriter::lookup converts an enumerator directly into an
/// EndReasonDictionaryIndex, and make_end_reason_writer builds the dictionary
/// by iterating from 0 to last_end_reason, so the order here defines the
/// dictionary order.
enum class ReadEndReason : std::uint8_t {
    unknown,
    mux_change,
    unblock_mux_change,
    data_service_unblock_mux_change,
    signal_positive,
    signal_negative,
    api_request,
    device_data_error,
    analysis_config_change,
    paused,

    // Alias for the highest valid enumerator. Update this when appending a new
    // reason; the static_asserts in end_reason_as_string and
    // end_reason_from_string will then flag the functions needing an update.
    last_end_reason = paused
};

/// \brief Get the textual name of a read end reason.
/// \param reason The end reason to name.
/// \returns A pointer to a string literal naming \p reason; "unknown" is
///          returned both for ReadEndReason::unknown and for any value that
///          does not match a named enumerator.
inline char const * end_reason_as_string(ReadEndReason reason)
{
    static_assert(
        ReadEndReason::last_end_reason == ReadEndReason::paused,
        "Need to add new end reason to this function");

    // Start from the fallback and overwrite it for every recognised reason.
    char const * name = "unknown";
    switch (reason) {
    case ReadEndReason::unknown:
        break;
    case ReadEndReason::mux_change:
        name = "mux_change";
        break;
    case ReadEndReason::unblock_mux_change:
        name = "unblock_mux_change";
        break;
    case ReadEndReason::data_service_unblock_mux_change:
        name = "data_service_unblock_mux_change";
        break;
    case ReadEndReason::signal_positive:
        name = "signal_positive";
        break;
    case ReadEndReason::signal_negative:
        name = "signal_negative";
        break;
    case ReadEndReason::api_request:
        name = "api_request";
        break;
    case ReadEndReason::device_data_error:
        name = "device_data_error";
        break;
    case ReadEndReason::analysis_config_change:
        name = "analysis_config_change";
        break;
    case ReadEndReason::paused:
        name = "paused";
        break;
    }
    return name;
}

/// \brief Parse the textual name of a read end reason.
/// \param reason The name to parse; matching is exact and case sensitive.
/// \returns The matching enumerator, or ReadEndReason::unknown when \p reason
///          is not one of the known names.
inline ReadEndReason end_reason_from_string(std::string const & reason)
{
    static_assert(
        ReadEndReason::last_end_reason == ReadEndReason::paused,
        "Need to add new end reason to this function");

    struct NamedReason {
        char const * name;
        ReadEndReason value;
    };

    // Every name accepted by this function, paired with its enumerator.
    static NamedReason const known_reasons[] = {
        {"unknown", ReadEndReason::unknown},
        {"mux_change", ReadEndReason::mux_change},
        {"unblock_mux_change", ReadEndReason::unblock_mux_change},
        {"data_service_unblock_mux_change", ReadEndReason::data_service_unblock_mux_change},
        {"signal_positive", ReadEndReason::signal_positive},
        {"signal_negative", ReadEndReason::signal_negative},
        {"api_request", ReadEndReason::api_request},
        {"device_data_error", ReadEndReason::device_data_error},
        {"analysis_config_change", ReadEndReason::analysis_config_change},
        {"paused", ReadEndReason::paused},
    };

    for (auto const & candidate : known_reasons) {
        if (reason == candidate.name) {
            return candidate.value;
        }
    }

    // Unrecognised names fall back to unknown.
    return ReadEndReason::unknown;
}

/// \brief Input query to a search for a number of read ids in a file.
///
/// Built from a span of read ids; the prepared entries are exposed through
/// read_id_count() and operator[]. The constructor is defined out of line.
class POD5_FORMAT_EXPORT ReadIdSearchInput {
public:
    /// \brief One entry of the prepared search input.
    struct InputId {
        /// The read id to search for.
        Uuid id;
        // NOTE(review): presumably the position of this id in the span passed
        // to the constructor - confirm against the constructor definition.
        std::size_t index;
    };

    /// \brief Prepare a search input from the read ids in \p input_ids.
    ReadIdSearchInput(gsl::span<Uuid const> const & input_ids);

    /// \brief Number of entries held by this search input.
    std::size_t read_id_count() const { return m_search_read_ids.size(); }

    /// \brief Access entry \p i of the prepared input; \p i is not bounds checked.
    InputId const & operator[](std::size_t i) const { return m_search_read_ids[i]; }

private:
    std::vector<InputId> m_search_read_ids;
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_writer.cpp
================================================
#include "pod5_format/read_table_writer.h"

#include "pod5_format/file_output_stream.h"
#include "pod5_format/internal/tracing/tracing.h"

#include <arrow/extension_type.h>
#include <arrow/ipc/writer.h>
#include <arrow/record_batch.h>
#include <arrow/type.h>
#include <arrow/util/compression.h>

namespace pod5 {

/// \brief Construct a read table writer around an already opened record batch writer.
/// \param writer            Arrow record batch writer that receives finished batches (moved in).
/// \param schema            Schema used when building record batches (moved in).
/// \param field_locations   Description of the read table fields, used to create the column builders.
/// \param table_batch_size  Number of rows buffered before a batch is written.
/// \param pore_writer       Dictionary writer attached to the pore_type column builder.
/// \param end_reason_writer Dictionary writer attached to the end_reason column builder.
/// \param run_info_writer   Dictionary writer attached to the run_info column builder.
/// \param output_stream     Stream notified via batch_complete() after each batch is written.
/// \param pool              Memory pool handed to the column builders.
ReadTableWriter::ReadTableWriter(
    std::shared_ptr<arrow::ipc::RecordBatchWriter> && writer,
    std::shared_ptr<arrow::Schema> && schema,
    std::shared_ptr<ReadTableSchemaDescription> const & field_locations,
    std::size_t table_batch_size,
    std::shared_ptr<PoreWriter> const & pore_writer,
    std::shared_ptr<EndReasonWriter> const & end_reason_writer,
    std::shared_ptr<RunInfoWriter> const & run_info_writer,
    std::shared_ptr<FileOutputStream> const & output_stream,
    arrow::MemoryPool * pool)
// schema is an rvalue reference: move it (as is done for writer) rather than
// paying for an extra shared_ptr copy.
: m_schema(std::move(schema))
, m_field_locations(field_locations)
, m_table_batch_size(table_batch_size)
, m_writer(std::move(writer))
, m_field_builders(m_field_locations, pool)
, m_output_stream{output_stream}
{
    // The dictionary-typed columns need access to the writers that own their
    // dictionary values.
    m_field_builders.get_builder(m_field_locations->pore_type).set_dict_writer(pore_writer);
    m_field_builders.get_builder(m_field_locations->end_reason).set_dict_writer(end_reason_writer);
    m_field_builders.get_builder(m_field_locations->run_info).set_dict_writer(run_info_writer);
}

// Move construction and move assignment are member-wise. They are defaulted
// here rather than in the header, where they are only declared.
ReadTableWriter::ReadTableWriter(ReadTableWriter && other) = default;
ReadTableWriter & ReadTableWriter::operator=(ReadTableWriter &&) = default;

/// \brief Close the writer on destruction if it is still open.
///
/// Any error reported by close() is deliberately discarded, as a destructor
/// has no way to report it.
ReadTableWriter::~ReadTableWriter()
{
    if (!m_writer) {
        // Already closed, or never owned a writer: nothing to flush.
        return;
    }

    (void)close();
}

/// \brief Append one read to the batch currently being built.
/// \param read_data       Per-read field values to store.
/// \param signal          Signal table row indices belonging to this read.
/// \param signal_duration Value stored in the column following the V1 fields.
/// \returns The row index of the new read (rows in already written batches
///          plus rows already in the current batch), or an error status.
///          Returns IOError("Writer terminated") once the writer is closed.
Result<std::size_t> ReadTableWriter::add_read(
    ReadData const & read_data,
    gsl::span<SignalTableRowIndex const> const & signal,
    std::uint64_t signal_duration)
{
    POD5_TRACE_FUNCTION();
    if (!m_writer) {
        return Status::IOError("Writer terminated");
    }

    // Only has an effect for the first row of a batch.
    ARROW_RETURN_NOT_OK(reserve_rows());

    // Compute the row index before the counters change below.
    auto row_id = m_written_batched_row_count + m_current_batch_row_count;
    // The argument order below must match the order expected by the field
    // builders.
    ARROW_RETURN_NOT_OK(m_field_builders.append(
        // V0 Fields
        read_data.read_id,
        signal,
        read_data.read_number,
        read_data.start_sample,
        read_data.median_before,

        // V1 Fields
        read_data.num_minknow_events,
        read_data.tracked_scaling_scale,
        read_data.tracked_scaling_shift,
        read_data.predicted_scaling_scale,
        read_data.predicted_scaling_shift,
        read_data.num_reads_since_mux_change,
        read_data.time_since_mux_change,

        // V2 Fields
        signal_duration,

        // V3 Fields
        read_data.channel,
        read_data.well,
        read_data.pore_type,
        read_data.calibration_offset,
        read_data.calibration_scale,
        read_data.end_reason,
        read_data.end_reason_forced,
        read_data.run_info,

        // V4 Fields
        read_data.open_pore_level));

    ++m_current_batch_row_count;

    // Flush automatically once the batch holds the configured number of rows.
    if (m_current_batch_row_count >= m_table_batch_size) {
        ARROW_RETURN_NOT_OK(write_batch());
    }
    return row_id;
}

/// \brief Flush any buffered rows and close the underlying Arrow writer.
/// \returns OK if the writer was already closed or closed successfully,
///          otherwise the first error hit while flushing or closing. On error
///          the writer is left open.
Status ReadTableWriter::close()
{
    if (m_writer) {
        // Write out whatever is still buffered, then finish the file.
        ARROW_RETURN_NOT_OK(write_batch());
        ARROW_RETURN_NOT_OK(m_writer->Close());

        // Dropping the writer marks this object as closed.
        m_writer.reset();
    }

    return Status::OK();
}

/// \brief Write a caller supplied record batch straight to the underlying writer.
/// \param record_batch The batch to write.
/// \returns IOError("Writer terminated") if the writer has been closed,
///          otherwise the status of the write and of the stream's
///          batch_complete() notification.
///
/// This function does not touch the row counters used by add_read.
Status ReadTableWriter::write_batch(arrow::RecordBatch const & record_batch)
{
    // This overload is public and can be called after close(); guard against
    // dereferencing the released writer, as add_read and write_batch() do.
    if (!m_writer) {
        return Status::IOError("Writer terminated");
    }

    ARROW_RETURN_NOT_OK(m_writer->WriteRecordBatch(record_batch));
    return m_output_stream->batch_complete();
}

/// \brief Turn the rows buffered so far into a record batch and write it.
/// \returns OK when there is nothing buffered or the batch was written,
///          IOError("Writer terminated") if rows are buffered but the writer
///          is closed, otherwise the error from building or writing the batch.
Status ReadTableWriter::write_batch()
{
    POD5_TRACE_FUNCTION();

    auto const rows_in_batch = m_current_batch_row_count;
    if (rows_in_batch == 0) {
        // Nothing buffered - an empty batch is never written.
        return Status::OK();
    }

    if (!m_writer) {
        return Status::IOError("Writer terminated");
    }

    ARROW_ASSIGN_OR_RAISE(auto finished_columns, m_field_builders.finish_columns());
    auto const batch =
        arrow::RecordBatch::Make(m_schema, rows_in_batch, std::move(finished_columns));

    // The counters are advanced before the write is attempted.
    m_written_batched_row_count += rows_in_batch;
    m_current_batch_row_count = 0;

    ARROW_RETURN_NOT_OK(m_writer->WriteRecordBatch(*batch));
    return m_output_stream->batch_complete();
}

/// \brief Reserve builder capacity for a whole batch of rows.
///
/// Space is only reserved when the current batch is empty; calls made part way
/// through a batch return OK without doing anything.
Status ReadTableWriter::reserve_rows()
{
    bool const at_batch_start = (m_current_batch_row_count == 0);
    if (at_batch_start) {
        return m_field_builders.reserve(m_table_batch_size);
    }

    // Capacity for this batch was reserved when its first row was added.
    return arrow::Status::OK();
}

/// \brief Create a ReadTableWriter that writes an Arrow IPC file to \p sink.
/// \param sink              Output stream receiving the table.
/// \param metadata          Key/value metadata applied to the schema and the file.
/// \param table_batch_size  Number of rows per written batch.
/// \param pore_writer       Dictionary writer for the pore type column.
/// \param end_reason_writer Dictionary writer for the end reason column.
/// \param run_info_writer   Dictionary writer for the run info column.
/// \param pool              Memory pool used for IPC writing and column building.
/// \returns The new writer, or the error from opening the Arrow file writer.
Result<ReadTableWriter> make_read_table_writer(
    std::shared_ptr<FileOutputStream> const & sink,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    std::size_t table_batch_size,
    std::shared_ptr<PoreWriter> const & pore_writer,
    std::shared_ptr<EndReasonWriter> const & end_reason_writer,
    std::shared_ptr<RunInfoWriter> const & run_info_writer,
    arrow::MemoryPool * pool)
{
    // Describe the table fields and derive the schema used for writing.
    auto schema_description = std::make_shared<ReadTableSchemaDescription>();
    auto table_schema = schema_description->make_writer_schema(metadata);

    arrow::ipc::IpcWriteOptions write_options;
    write_options.memory_pool = pool;
    write_options.emit_dictionary_deltas = true;
    // todo... consider:
    //ARROW_ASSIGN_OR_RAISE(options.codec, arrow::util::Codec::Create(arrow::Compression::LZ4_FRAME));

    ARROW_ASSIGN_OR_RAISE(
        auto file_writer, arrow::ipc::MakeFileWriter(sink, table_schema, write_options, metadata));

    return ReadTableWriter(
        std::move(file_writer),
        std::move(table_schema),
        schema_description,
        table_batch_size,
        pore_writer,
        end_reason_writer,
        run_info_writer,
        sink,
        pool);
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_writer.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/read_table_schema.h"
#include "pod5_format/read_table_writer_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/schema_field_builder.h"
#include "pod5_format/signal_table_utils.h"

#include <arrow/array/builder_dict.h>
#include <arrow/io/type_fwd.h>

namespace arrow {
class Schema;

namespace ipc {
class RecordBatchWriter;
}
}  // namespace arrow

namespace pod5 {

class FileOutputStream;

/// \brief Writer that buffers reads into batches and writes them as Arrow record batches.
///
/// The writer is movable but not copyable. Destroying an open writer closes
/// it, discarding any error that close() reports.
class POD5_FORMAT_EXPORT ReadTableWriter {
public:
    /// \brief Construct a writer around an already opened record batch writer.
    /// \param writer            Arrow writer that receives finished batches.
    /// \param schema            Schema used when building record batches.
    /// \param field_locations   Description of the read table fields.
    /// \param table_batch_size  Number of rows buffered before a batch is written.
    /// \param pore_writer       Dictionary writer for the pore type column.
    /// \param end_reason_writer Dictionary writer for the end reason column.
    /// \param run_info_writer   Dictionary writer for the run info column.
    /// \param output_stream     Stream notified after each batch is written.
    /// \param pool              Memory pool used by the column builders.
    ReadTableWriter(
        std::shared_ptr<arrow::ipc::RecordBatchWriter> && writer,
        std::shared_ptr<arrow::Schema> && schema,
        std::shared_ptr<ReadTableSchemaDescription> const & field_locations,
        std::size_t table_batch_size,
        std::shared_ptr<PoreWriter> const & pore_writer,
        std::shared_ptr<EndReasonWriter> const & end_reason_writer,
        std::shared_ptr<RunInfoWriter> const & run_info_writer,
        std::shared_ptr<FileOutputStream> const & output_stream,
        arrow::MemoryPool * pool);
    ReadTableWriter(ReadTableWriter &&);
    ReadTableWriter & operator=(ReadTableWriter &&);
    ReadTableWriter(ReadTableWriter const &) = delete;
    ReadTableWriter & operator=(ReadTableWriter const &) = delete;
    ~ReadTableWriter();

    /// \brief Add a read to the read table, adding to the current batch.
    /// \param read_data The data to add as a read.
    /// \param signal List of signal table row indices that belong to this read.
    /// \param signal_duration The length of the read in samples.
    /// \returns The row index of the inserted read, or a status on failure.
    Result<std::size_t> add_read(
        ReadData const & read_data,
        gsl::span<SignalTableRowIndex const> const & signal,
        std::uint64_t signal_duration);

    /// \brief Close this writer, signaling no further data will be written to the writer.
    ///
    /// Buffered rows are flushed first. Closing an already closed writer is a no-op.
    Status close();

    /// \brief Reserve space for a full batch of row writes.
    ///
    /// Called automatically by add_read; only reserves when the current batch
    /// is empty.
    Status reserve_rows();

    /// \brief Find the schema for the table
    std::shared_ptr<arrow::Schema> const & schema() const { return m_schema; }

    /// \brief Flush passed data into the writer as a record batch.
    ///
    /// The row counters used to compute add_read's return value are not
    /// updated by this call.
    Status write_batch(arrow::RecordBatch const &);

private:
    /// \brief Flush buffered data into the writer as a record batch.
    Status write_batch();

    std::shared_ptr<arrow::Schema> m_schema;
    std::shared_ptr<ReadTableSchemaDescription> m_field_locations;
    // Number of rows collected before a batch is written automatically.
    std::size_t m_table_batch_size;

    // Null once the writer has been closed (or moved from).
    std::shared_ptr<arrow::ipc::RecordBatchWriter> m_writer;

    ReadTableSchemaDescription::FieldBuilders m_field_builders;

    // Rows contained in batches already handed to m_writer by write_batch().
    std::size_t m_written_batched_row_count = 0;
    // Rows appended to the builders since the last flush.
    std::size_t m_current_batch_row_count = 0;
    std::shared_ptr<FileOutputStream> m_output_stream;
};

/// \brief Make a new writer for a read table.
/// \param sink Sink to be used for output of the table.
/// \param metadata Metadata to be applied to the table schema.
/// \param table_batch_size The size of each batch written for the table.
/// \param pore_writer Dictionary writer attached to the pore type column.
/// \param end_reason_writer Dictionary writer attached to the end reason column.
/// \param run_info_writer Dictionary writer attached to the run info column.
/// \param pool Pool to be used for building table in memory.
/// \returns The writer for the new table.
POD5_FORMAT_EXPORT Result<ReadTableWriter> make_read_table_writer(
    std::shared_ptr<FileOutputStream> const & sink,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    std::size_t table_batch_size,
    std::shared_ptr<PoreWriter> const & pore_writer,
    std::shared_ptr<EndReasonWriter> const & end_reason_writer,
    std::shared_ptr<RunInfoWriter> const & run_info_writer,
    arrow::MemoryPool * pool);

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_writer_utils.cpp
================================================
#include "pod5_format/read_table_writer_utils.h"

#include "pod5_format/read_table_schema.h"

#include <arrow/array/array_dict.h>
#include <arrow/array/builder_binary.h>
#include <arrow/array/builder_nested.h>
#include <arrow/array/builder_primitive.h>

namespace pod5 {

namespace detail {

/// \brief Assemble Arrow array data for the strings held by a dictionary key builder.
/// \param type            Arrow type to tag the resulting array data with.
/// \param builder         Builder holding the string bytes and per-entry start offsets.
/// \param expected_length Number of entries the builder is expected to hold.
/// \returns Array data with a null validity buffer, an offsets buffer and the
///          string bytes, or Invalid when the builder has no string buffer or
///          its entry count differs from \p expected_length.
arrow::Result<std::shared_ptr<arrow::ArrayData>> get_array_data(
    std::shared_ptr<arrow::DataType> const & type,
    StringDictionaryKeyBuilder const & builder,
    std::size_t expected_length)
{
    auto const string_bytes = builder.get_string_data();
    if (string_bytes == nullptr) {
        return Status::Invalid("Missing array value data for dictionary");
    }

    auto const entry_starts = builder.get_typed_offset_data();
    if (entry_starts.size() != expected_length) {
        return Status::Invalid("Invalid size for field in struct");
    }

    // Arrow needs one more offset than there are entries: copy the start of
    // every entry, then terminate with the total size of the string bytes.
    arrow::TypedBufferBuilder<std::int32_t> offsets_builder;
    ARROW_RETURN_NOT_OK(offsets_builder.Append(entry_starts.data(), entry_starts.size()));
    ARROW_RETURN_NOT_OK(offsets_builder.Append(string_bytes->size()));

    std::shared_ptr<arrow::Buffer> offsets_buffer;
    ARROW_RETURN_NOT_OK(offsets_builder.Finish(&offsets_buffer));

    return arrow::ArrayData::Make(
        type, expected_length, {nullptr, offsets_buffer, string_bytes}, 0, 0);
}

}  // namespace detail

/// \brief Create an empty pore dictionary writer.
/// \param pool Memory pool forwarded to the writer.
arrow::Result<std::shared_ptr<PoreWriter>> make_pore_writer(arrow::MemoryPool * pool)
{
    auto pore_writer = std::make_shared<PoreWriter>(pool);
    return pore_writer;
}

/// \brief Create an end reason dictionary writer pre-populated with every end reason name.
/// \param pool Memory pool used to build the string array of names.
/// \returns The writer, or the error from building the string array.
arrow::Result<std::shared_ptr<EndReasonWriter>> make_end_reason_writer(arrow::MemoryPool * pool)
{
    // One entry per enumerator, in enumerator order, so that an enumerator's
    // numeric value is also its position in the array.
    auto const last_value = static_cast<int>(ReadEndReason::last_end_reason);

    arrow::StringBuilder name_builder(pool);
    for (int value = 0; value <= last_value; ++value) {
        auto const reason = static_cast<ReadEndReason>(value);
        ARROW_RETURN_NOT_OK(name_builder.Append(end_reason_as_string(reason)));
    }

    std::shared_ptr<arrow::StringArray> end_reasons;
    ARROW_RETURN_NOT_OK(name_builder.Finish(&end_reasons));

    return std::make_shared<EndReasonWriter>(end_reasons);
}

/// \brief Create an empty run info dictionary writer.
/// \param pool Memory pool forwarded to the writer.
arrow::Result<std::shared_ptr<RunInfoWriter>> make_run_info_writer(arrow::MemoryPool * pool)
{
    auto run_info_writer = std::make_shared<RunInfoWriter>(pool);
    return run_info_writer;
}

/// \brief Combine \p indices with this writer's current values into a dictionary array.
/// \param indices Index array referring to entries of the value array.
/// \returns The dictionary array, or the error from get_value_array() or
///          arrow::DictionaryArray::FromArrays.
pod5::Result<std::shared_ptr<arrow::Array>> DictionaryWriter::build_dictionary_array(
    std::shared_ptr<arrow::Array> const & indices)
{
    ARROW_ASSIGN_OR_RAISE(auto dictionary_values, get_value_array());
    return arrow::DictionaryArray::FromArrays(indices, dictionary_values);
}

/// \brief Construct an empty pore writer, forwarding \p pool to its key builder.
PoreWriter::PoreWriter(arrow::MemoryPool * pool) : m_builder(pool) {}

/// \brief Build a string array holding every pore type added so far.
/// \returns The array, or the error reported while assembling its data.
pod5::Result<std::shared_ptr<arrow::Array>> PoreWriter::get_value_array()
{
    ARROW_ASSIGN_OR_RAISE(
        auto pore_type_data, get_array_data(arrow::utf8(), m_builder, item_count()));
    return std::make_shared<arrow::StringArray>(pore_type_data);
}

/// \brief Number of pore types added to the dictionary so far.
std::size_t PoreWriter::item_count() { return m_builder.length(); }

/// \brief Construct an end reason writer that serves a fixed array of values.
/// \param end_reasons String array returned unchanged by get_value_array().
EndReasonWriter::EndReasonWriter(std::shared_ptr<arrow::StringArray> const & end_reasons)
: m_end_reasons(end_reasons)
{
}

/// \brief Get the dictionary values: the array supplied at construction.
pod5::Result<std::shared_ptr<arrow::Array>> EndReasonWriter::get_value_array()
{
    return m_end_reasons;
}

/// \brief Number of entries in the end reason array supplied at construction.
std::size_t EndReasonWriter::item_count() { return m_end_reasons->length(); }

/// \brief Construct an empty run info writer, forwarding \p pool to its key builder.
RunInfoWriter::RunInfoWriter(arrow::MemoryPool * pool) : m_builder(pool) {}

/// \brief Build a string array holding every acquisition id added so far.
/// \returns The array, or the error reported while assembling its data.
pod5::Result<std::shared_ptr<arrow::Array>> RunInfoWriter::get_value_array()
{
    ARROW_ASSIGN_OR_RAISE(
        auto acquisition_id_data, get_array_data(arrow::utf8(), m_builder, item_count()));
    return std::make_shared<arrow::StringArray>(acquisition_id_data);
}

/// \brief Number of acquisition ids added to the dictionary so far.
std::size_t RunInfoWriter::item_count() { return m_builder.length(); }

}  // namespace pod5


================================================
FILE: c++/pod5_format/read_table_writer_utils.h
================================================
#pragma once

#include "pod5_format/dictionary_writer.h"
#include "pod5_format/expandable_buffer.h"
#include "pod5_format/pod5_format_export.h"
#include "pod5_format/read_table_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/tuple_utils.h"

#include <arrow/array/array_binary.h>
#include <arrow/io/type_fwd.h>
#include <arrow/util/bit_util.h>
#include <gsl/gsl-lite.hpp>

#include <chrono>
#include <cstdint>
#include <map>

namespace pod5 {

namespace detail {

/// \brief Accumulates strings as one contiguous byte buffer plus a start offset per string.
///
/// Each appended string records the current size of the byte buffer as its
/// start offset and then adds its characters to the end of that buffer.
class StringDictionaryKeyBuilder {
public:
    /// \brief Construct a builder whose buffers are created with \p pool.
    StringDictionaryKeyBuilder(arrow::MemoryPool * pool = nullptr)
    : m_offset_values(pool)
    , m_string_values(pool)
    {
    }

    /// \brief Initialise both underlying buffers with \p pool.
    /// \returns The first error reported by either buffer, or OK.
    arrow::Status init_buffer(arrow::MemoryPool * pool)
    {
        ARROW_RETURN_NOT_OK(m_offset_values.init_buffer(pool));
        ARROW_RETURN_NOT_OK(m_string_values.init_buffer(pool));
        return arrow::Status::OK();
    }

    /// \brief Append one string to the builder.
    /// \param value The string to add; its bytes are copied.
    arrow::Status append(std::string const & value)
    {
        // The new entry starts where the existing string bytes currently end,
        // so the offset has to be recorded before the bytes are added.
        ARROW_RETURN_NOT_OK(m_offset_values.append(m_string_values.size()));

        auto const characters = gsl::make_span(value.data(), value.size());
        return m_string_values.append_array(characters.as_span<std::uint8_t const>());
    }

    /// \brief Number of strings appended so far.
    std::size_t length() const { return m_offset_values.size(); }

    /// \brief Buffer holding the bytes of all appended strings.
    std::shared_ptr<arrow::Buffer> get_string_data() const { return m_string_values.get_buffer(); }

    /// \brief Start offset of every appended string, in append order.
    gsl::span<std::int32_t const> get_typed_offset_data() const
    {
        return m_offset_values.get_data_span();
    }

private:
    ExpandableBuffer<std::int32_t> m_offset_values;
    ExpandableBuffer<std::uint8_t> m_string_values;
};

}  // namespace detail

/// \brief Dictionary writer collecting the pore types referenced by the read table.
class POD5_FORMAT_EXPORT PoreWriter : public DictionaryWriter {
public:
    /// \brief Construct an empty writer whose builder uses \p pool.
    PoreWriter(arrow::MemoryPool * pool);

    /// \brief Add a pore type to the dictionary.
    /// \param pore_type Name of the pore type to add.
    /// \returns The dictionary index of the new entry, or Invalid when the
    ///          dictionary already holds the maximum number of entries.
    pod5::Result<PoreDictionaryIndex> add(std::string const & pore_type)
    {
        // Entries are addressed through 16 bit signed indices, which bounds
        // how many the dictionary may hold.
        auto const max_entries = std::size_t(std::numeric_limits<std::int16_t>::max());
        auto const next_index = item_count();

        if (next_index < max_entries) {
            ARROW_RETURN_NOT_OK(m_builder.append(pore_type));
            return next_index;
        }

        return arrow::Status::Invalid(
            "Failed to add pore to dictionary, too many indices in file");
    }

    pod5::Result<std::shared_ptr<arrow::Array>> get_value_array() override;
    std::size_t item_count() override;

private:
    detail::StringDictionaryKeyBuilder m_builder;
};

/// \brief Dictionary writer serving a fixed array of end reason names.
class POD5_FORMAT_EXPORT EndReasonWriter : public DictionaryWriter {
public:
    /// \brief Construct the writer from the array of end reason names it serves.
    EndReasonWriter(std::shared_ptr<arrow::StringArray> const & end_reasons);

    /// \brief Translate an end reason into its dictionary index.
    /// \param end_reason The end reason to look up.
    /// \returns The enumerator's value as a dictionary index, or Invalid when
    ///          \p end_reason lies beyond ReadEndReason::last_end_reason.
    pod5::Result<EndReasonDictionaryIndex> lookup(ReadEndReason end_reason) const
    {
        bool const is_known_reason = !(end_reason > ReadEndReason::last_end_reason);
        if (is_known_reason) {
            return EndReasonDictionaryIndex(end_reason);
        }

        return pod5::Status::Invalid("Invalid read end reason requested");
    }

    pod5::Result<std::shared_ptr<arrow::Array>> get_value_array() override;
    std::size_t item_count() override;

private:
    std::shared_ptr<arrow::StringArray> m_end_reasons;
};

/// \brief Dictionary writer collecting the acquisition ids referenced by the read table.
class POD5_FORMAT_EXPORT RunInfoWriter : public DictionaryWriter {
public:
    /// \brief Construct an empty writer whose builder uses \p pool.
    RunInfoWriter(arrow::MemoryPool * pool);

    /// \brief Add an acquisition id to the dictionary.
    /// \param acquisition_id The acquisition id to add.
    /// \returns The dictionary index of the new entry, or Invalid when the
    ///          dictionary already holds the maximum number of entries.
    pod5::Result<RunInfoDictionaryIndex> add(std::string const & acquisition_id)
    {
        // Entries are addressed through 16 bit signed indices, which bounds
        // how many the dictionary may hold.
        auto const max_entries = std::size_t(std::numeric_limits<std::int16_t>::max());
        auto const next_index = item_count();

        if (next_index < max_entries) {
            ARROW_RETURN_NOT_OK(m_builder.append(acquisition_id));
            return next_index;
        }

        return arrow::Status::Invalid(
            "Failed to add run info to dictionary, too many indices in file");
    }

    pod5::Result<std::shared_ptr<arrow::Array>> get_value_array() override;
    std::size_t item_count() override;

private:
    detail::StringDictionaryKeyBuilder m_builder;
};

/// \brief Make a new, empty pore dictionary writer.
/// \param pool Memory pool passed to the writer's constructor.
POD5_FORMAT_EXPORT arrow::Result<std::shared_ptr<PoreWriter>> make_pore_writer(
    arrow::MemoryPool * pool);

/// \brief Make an end reason dictionary writer holding the name of every ReadEndReason.
/// \param pool Memory pool used to build the array of names.
POD5_FORMAT_EXPORT arrow::Result<std::shared_ptr<EndReasonWriter>> make_end_reason_writer(
    arrow::MemoryPool * pool);

/// \brief Make a new, empty run info dictionary writer.
/// \param pool Memory pool passed to the writer's constructor.
POD5_FORMAT_EXPORT arrow::Result<std::shared_ptr<RunInfoWriter>> make_run_info_writer(
    arrow::MemoryPool * pool);

}  // namespace pod5


================================================
FILE: c++/pod5_format/result.h
================================================
#pragma once

#include <arrow/result.h>

namespace pod5 {

/// pod5::Result is just an Arrow Result right now.
template <typename R>
using Result = arrow::Result<R>;
/// pod5::Status is likewise an alias for arrow::Status.
using Status = arrow::Status;

}  // namespace pod5


================================================
FILE: c++/pod5_format/run_info_table_reader.cpp
================================================
#include "pod5_format/run_info_table_reader.h"

#include "pod5_format/schema_metadata.h"
#include "pod5_format/schema_utils.h"

#include <arrow/array/array_binary.h>
#include <arrow/array/array_dict.h>
#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/ipc/reader.h>

#include <algorithm>

namespace pod5 {

/// \brief Extract one row of a string-to-string map column as a list of pairs.
/// \param map_array Map column to read from; its keys and items are accessed
///                  as string arrays.
/// \param row_index Row of the map column to extract.
/// \returns The key/value pairs of the row, in stored order.
inline std::vector<std::pair<std::string, std::string>> value_for_map(
    std::shared_ptr<arrow::MapArray> const & map_array,
    std::size_t row_index)
{
    auto const key_strings = std::dynamic_pointer_cast<arrow::StringArray>(map_array->keys());
    auto const item_strings = std::dynamic_pointer_cast<arrow::StringArray>(map_array->items());

    // The row's entries occupy a contiguous range of the flattened key and
    // item arrays.
    std::size_t const first_entry = map_array->value_offset(row_index);
    std::size_t const entry_count = map_array->value_length(row_index);

    std::vector<std::pair<std::string, std::string>> entries;
    std::size_t entry = first_entry;
    while (entry < first_entry + entry_count) {
        entries.emplace_back(key_strings->GetString(entry), item_strings->GetString(entry));
        ++entry;
    }
    return entries;
}

/// \brief Wrap an Arrow record batch of the run info table.
/// \param batch           The record batch; ownership is passed to the base class.
/// \param field_locations Schema description used to locate columns in \p batch.
RunInfoTableRecordBatch::RunInfoTableRecordBatch(
    std::shared_ptr<arrow::RecordBatch> && batch,
    std::shared_ptr<RunInfoTableSchemaDescription const> const & field_locations)
: TableRecordBatch(std::move(batch))
, m_field_locations(field_locations)
{
}

/// \brief Move construct a record batch, taking over \p other's base state and field locations.
RunInfoTableRecordBatch::RunInfoTableRecordBatch(RunInfoTableRecordBatch && other)
: TableRecordBatch(std::move(other))
// Moving the base above only consumes the TableRecordBatch part of other, so
// its m_field_locations is still intact here.
, m_field_locations(std::move(other.m_field_locations))
{
}

/// \brief Move assign a record batch from \p other.
/// \returns A reference to this object.
RunInfoTableRecordBatch & RunInfoTableRecordBatch::operator=(RunInfoTableRecordBatch && other)
{
    // A named rvalue reference is an lvalue, so it must be cast back to an
    // rvalue for the base class to be move assigned rather than copy assigned.
    TableRecordBatch & base = *this;
    base = std::move(static_cast<TableRecordBatch &>(other));

    // The base assignment does not touch the derived member, so it is still
    // valid to move from here.
    m_field_locations = std::move(other.m_field_locations);
    return *this;
}

/// \brief Look up every run info column of this batch.
/// \returns A RunInfoTableRecordColumns with one entry per field of the
///          schema description, plus the table version the schema reports.
Result<RunInfoTableRecordColumns> RunInfoTableRecordBatch::columns() const
{
    RunInfoTableRecordColumns result;
    result.table_version = m_field_locations->table_version();

    auto const & bat = batch();

    // Each column is located through its entry in the schema description.
    // V0 fields:
    result.acquisition_id = find_column(bat, m_field_locations->acquisition_id);
    result.acquisition_start_time = find_column(bat, m_field_locations->acquisition_start_time);
    result.adc_max = find_column(bat, m_field_locations->adc_max);
    result.adc_min = find_column(bat, m_field_locations->adc_min);
    result.context_tags = find_column(bat, m_field_locations->context_tags);
    result.experiment_name = find_column(bat, m_field_locations->experiment_name);
    result.flow_cell_id = find_column(bat, m_field_locations->flow_cell_id);
    result.flow_cell_product_code = find_column(bat, m_field_locations->flow_cell_product_code);
    result.protocol_name = find_column(bat, m_field_locations->protocol_name);
    result.protocol_run_id = find_column(bat, m_field_locations->protocol_run_id);
    result.protocol_start_time = find_column(bat, m_field_locations->protocol_start_time);
    result.sample_id = find_column(bat, m_field_locations->sample_id);
    result.sample_rate = find_column(bat, m_field_locations->sample_rate);
    result.sequencing_kit = find_column(bat, m_field_locations->sequencing_kit);
    result.sequencer_position = find_column(bat, m_field_locations->sequencer_position);
    result.sequencer_position_type = find_column(bat, m_field_locations->sequencer_position_type);
    result.software = find_column(bat, m_field_locations->software);
    result.system_name = find_column(bat, m_field_locations->system_name);
    result.system_type = find_column(bat, m_field_locations->system_type);
    result.tracking_id = find_column(bat, m_field_locations->tracking_id);

    return result;
}

//---------------------------------------------------------------------------------------------------------------------

/// \brief Construct a run info table reader.
/// \param input_source    Opaque handle to the input, forwarded to the TableReader base.
/// \param reader          Arrow file reader used to read record batches.
/// \param field_locations Schema description used to locate columns.
/// \param schema_metadata Metadata read from the table schema.
/// \param pool            Memory pool forwarded to the TableReader base.
RunInfoTableReader::RunInfoTableReader(
    std::shared_ptr<void> && input_source,
    std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
    std::shared_ptr<RunInfoTableSchemaDescription const> const & field_locations,
    SchemaMetadataDescription && schema_metadata,
    arrow::MemoryPool * pool)
: TableReader(std::move(input_source), std::move(reader), std::move(schema_metadata), pool)
, m_field_locations(field_locations)
{
}

/// \brief Move construct a reader from \p other.
///
/// Only the TableReader base and the field locations are taken from \p other;
/// the remaining members are not initialised from it here.
RunInfoTableReader::RunInfoTableReader(RunInfoTableReader && other)
: TableReader(std::move(other))
, m_field_locations(std::move(other.m_field_locations))
{
}

/// \brief Move assign a reader from \p other.
///
/// The TableReader base and the field locations are taken from \p other. Run
/// infos cached for the previously opened table are dropped so that they are
/// reloaded lazily from the newly assigned table.
/// \returns A reference to this object.
RunInfoTableReader & RunInfoTableReader::operator=(RunInfoTableReader && other)
{
    if (this == &other) {
        return *this;
    }

    // Move the base from other (not from *this, which would leave this reader
    // attached to its old input).
    static_cast<TableReader &>(*this) = std::move(static_cast<TableReader &>(other));
    m_field_locations = std::move(other.m_field_locations);

    // Cached entries describe the table this reader used to wrap; discard them
    // to match the empty caches of a move constructed reader.
    m_run_infos.clear();
    m_run_info_lookup.clear();
    return *this;
}

/// \brief Read record batch \p i of the run info table.
/// \param i Index of the batch to read.
/// \returns The batch wrapped with this reader's field locations, or the error
///          from reading it. Reads are serialised through m_batch_get_mutex.
Result<RunInfoTableRecordBatch> RunInfoTableReader::read_record_batch(std::size_t i) const
{
    std::lock_guard<std::mutex> batch_lock(m_batch_get_mutex);

    ARROW_ASSIGN_OR_RAISE(auto arrow_batch, TableReader::ReadRecordBatch(i));
    return RunInfoTableRecordBatch(std::move(arrow_batch), m_field_locations);
}

/// \brief Find the run info with the given acquisition id.
/// \param acquisition_id The acquisition id to search for.
/// \returns The cached or newly loaded run info, Invalid when no row of the
///          table carries \p acquisition_id, or any error hit while reading.
///
/// Lookups are served from the acquisition id cache when possible; otherwise
/// the table is scanned batch by batch and the first matching row is loaded
/// and cached. The whole call runs under m_run_info_lookup_mutex.
Result<std::shared_ptr<RunInfoData const>> RunInfoTableReader::find_run_info(
    std::string const & acquisition_id) const
{
    std::lock_guard<std::mutex> l(m_run_info_lookup_mutex);
    auto it = m_run_info_lookup.find(acquisition_id);
    if (it != m_run_info_lookup.end()) {
        return it->second;
    }

    ARROW_RETURN_NOT_OK(prepare_run_infos_vector());

    std::shared_ptr<RunInfoData const> run_info = nullptr;
    // Table-wide index of the first row of the batch being scanned. The index
    // handed to load_run_info_from_batch selects the by-index cache slot, so
    // it must be the row's position in the whole table, not a match counter.
    std::size_t batch_first_row = 0;
    for (std::size_t i = 0; i < num_record_batches(); ++i) {
        ARROW_ASSIGN_OR_RAISE(auto batch, read_record_batch(i));
        auto acq_id = find_column(batch.batch(), m_field_locations->acquisition_id);
        std::size_t const batch_rows = batch.num_rows();

        for (std::size_t j = 0; j < batch_rows; ++j) {
            if (acq_id->Value(j) == acquisition_id) {
                ARROW_ASSIGN_OR_RAISE(
                    run_info, load_run_info_from_batch(batch, j, batch_first_row + j));
                break;
            }
        }

        if (run_info) {
            break;
        }
        batch_first_row += batch_rows;
    }

    if (!run_info) {
        return arrow::Status::Invalid(
            "Failed to find acquisition id '", acquisition_id, "' in run info table");
    }

    return run_info;
}

/// \brief Get the run info stored at table row \p index.
/// \param index Zero based row index across all batches of the run info table.
/// \returns The cached or newly loaded run info, IndexError when \p index is
///          out of range, Invalid when the row cannot be located in a batch,
///          or any error hit while reading.
///
/// The batch holding the row is derived from the row count of the first
/// batch, i.e. every batch except the last is assumed to have that size.
Result<std::shared_ptr<RunInfoData const>> RunInfoTableReader::get_run_info(std::size_t index) const
{
    // The run info caches are shared with find_run_info, which guards them
    // with this mutex; take it here too so both entry points are consistent.
    std::lock_guard<std::mutex> l(m_run_info_lookup_mutex);

    ARROW_RETURN_NOT_OK(prepare_run_infos_vector());

    // index is unsigned, so only the upper bound needs checking.
    if (index >= m_run_infos.size()) {
        return arrow::Status::IndexError(
            "Invalid index into run infos (expected ", index, " < ", m_run_infos.size(), ")");
    }

    if (m_run_infos[index]) {
        return m_run_infos[index];
    }

    ARROW_ASSIGN_OR_RAISE(auto first_batch, read_record_batch(0));
    auto const batch_size = first_batch.num_rows();
    if (batch_size == 0) {
        // An empty first batch gives no batch size to divide by.
        return Status::Invalid("Row outside batch bounds");
    }

    auto const batch_idx = index / batch_size;
    auto const batch_row = index - (batch_idx * batch_size);

    if (batch_idx >= num_record_batches()) {
        return Status::Invalid("Row outside batch bounds");
    }

    ARROW_ASSIGN_OR_RAISE(auto batch, read_record_batch(batch_idx));

    return load_run_info_from_batch(batch, batch_row, index);
}

/// \brief Compute the number of run infos (rows) in the table.
/// \returns Zero for a table without batches; otherwise the row count of the
///          first batch multiplied by the number of batches before the last,
///          plus the row count of the last batch. Errors from reading either
///          batch are propagated.
Result<std::size_t> RunInfoTableReader::get_run_info_count() const
{
    auto const total_batches = num_record_batches();
    if (total_batches == 0) {
        return 0;
    }

    // Only the first and last batches are inspected; every batch in between
    // is taken to hold as many rows as the first one.
    ARROW_ASSIGN_OR_RAISE(auto leading_batch, read_record_batch(0));
    ARROW_ASSIGN_OR_RAISE(auto trailing_batch, read_record_batch(total_batches - 1));

    auto const full_batch_count = total_batches - 1;
    return full_batch_count * leading_batch.num_rows() + trailing_batch.num_rows();
}

/// \brief Build a RunInfoData from one row of a batch and cache it.
/// \param batch        Batch containing the row.
/// \param batch_index  Row within \p batch to read (a row index, not a batch number).
/// \param global_index Slot of the by-index cache (m_run_infos) to store the result in.
/// \returns The newly created run info, or the error from resolving the columns.
///
/// NOTE(review): \p global_index is not bounds checked against m_run_infos
/// here; callers are expected to have sized the vector and to pass a valid slot.
Result<std::shared_ptr<RunInfoData const>> RunInfoTableReader::load_run_info_from_batch(
    RunInfoTableRecordBatch const & batch,
    std::size_t batch_index,
    std::size_t global_index) const
{
    ARROW_ASSIGN_OR_RAISE(auto columns, batch.columns());

    // Arguments are positional and must follow the RunInfoData constructor's
    // parameter order.
    auto acquisition_id = columns.acquisition_id->GetString(batch_index);
    auto run_info = std::make_shared<RunInfoData>(
        acquisition_id,
        columns.acquisition_start_time->Value(batch_index),
        columns.adc_max->Value(batch_index),
        columns.adc_min->Value(batch_index),
        value_for_map(columns.context_tags, batch_index),
        columns.experiment_name->GetString(batch_index),
        columns.flow_cell_id->GetString(batch_index),
        columns.flow_cell_product_code->GetString(batch_index),
        columns.protocol_name->GetString(batch_index),
        columns.protocol_run_id->GetString(batch_index),
        columns.protocol_start_time->Value(batch_index),
        columns.sample_id->GetString(batch_index),
        columns.sample_rate->Value(batch_index),
        columns.sequencing_kit->GetString(batch_index),
        columns.sequencer_position->GetString(batch_index),
        columns.sequencer_position_type->GetString(batch_index),
        columns.software->GetString(batch_index),
        columns.system_name->GetString(batch_index),
        columns.system_type->GetString(batch_index),
        value_for_map(columns.tracking_id, batch_index));

    // Cache run info for later retrieval by index:
    m_run_infos[global_index] = run_info;
    // ...and for later retrieval by acquisition id.
    m_run_info_lookup[acquisition_id] = run_info;
    return run_info;
}

/// \brief Size the by-index run info cache to the number of rows in the table.
///
/// Does nothing when the cache already has entries; otherwise it is resized to
/// get_run_info_count() empty slots.
/// \returns OK, or the error from counting the run infos.
arrow::Status RunInfoTableReader::prepare_run_infos_vector() const
{
    if (!m_run_infos.empty()) {
        // Already sized by an earlier call.
        return Status::OK();
    }

    ARROW_ASSIGN_OR_RAISE(auto row_count, get_run_info_count());
    m_run_infos.resize(row_count);
    return Status::OK();
}

//---------------------------------------------------------------------------------------------------------------------

/// Open a run info table stored as an Arrow IPC file and wrap it in a reader.
///
/// \param input Random access file holding the table.
/// \param pool  Memory pool handed to the Arrow IPC reader and to the resulting table reader.
/// \returns The reader, or an error when the file cannot be opened, the schema carries no
///          key/value metadata, or the metadata/schema cannot be interpreted.
Result<RunInfoTableReader> make_run_info_table_reader(
    std::shared_ptr<arrow::io::RandomAccessFile> const & input,
    arrow::MemoryPool * pool)
{
    arrow::ipc::IpcReadOptions read_options;
    read_options.memory_pool = pool;

    ARROW_ASSIGN_OR_RAISE(
        auto batch_reader, arrow::ipc::RecordBatchFileReader::Open(input, read_options));

    // The pod5 file identity and version are stored as schema level key/value metadata.
    auto const schema = batch_reader->schema();
    auto const raw_metadata = schema->metadata();
    if (raw_metadata == nullptr) {
        return Status::IOError("Missing metadata on run info table schema");
    }

    ARROW_ASSIGN_OR_RAISE(auto parsed_metadata, read_schema_key_value_metadata(raw_metadata));
    ARROW_ASSIGN_OR_RAISE(
        auto schema_description, read_run_info_table_schema(parsed_metadata, schema));

    // The reader keeps `input` alive through a type-erased shared pointer.
    return RunInfoTableReader(
        {input},
        std::move(batch_reader),
        schema_description,
        std::move(parsed_metadata),
        pool);
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/run_info_table_reader.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/read_table_utils.h"
#include "pod5_format/result.h"
#include "pod5_format/run_info_table_schema.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/table_reader.h"
#include "pod5_format/types.h"

#include <arrow/io/type_fwd.h>
#include <gsl/gsl-lite.hpp>

#include <mutex>
#include <unordered_map>

namespace arrow {
class Schema;

namespace io {
class RandomAccessFile;
}

namespace ipc {
class RecordBatchFileReader;
}
}  // namespace arrow

namespace pod5 {

/// Typed Arrow column handles for one run info record batch.
///
/// There is one member per field of the run info table; each row of these arrays
/// describes a single run info entry.
struct RunInfoTableRecordColumns {
    // V0 Fields
    std::shared_ptr<arrow::StringArray> acquisition_id;
    std::shared_ptr<arrow::TimestampArray> acquisition_start_time;
    std::shared_ptr<arrow::Int16Array> adc_max;
    std::shared_ptr<arrow::Int16Array> adc_min;
    // Map column; the schema declares it as a utf8 -> utf8 map.
    std::shared_ptr<arrow::MapArray> context_tags;
    std::shared_ptr<arrow::StringArray> experiment_name;
    std::shared_ptr<arrow::StringArray> flow_cell_id;
    std::shared_ptr<arrow::StringArray> flow_cell_product_code;
    std::shared_ptr<arrow::StringArray> protocol_name;
    std::shared_ptr<arrow::StringArray> protocol_run_id;
    std::shared_ptr<arrow::TimestampArray> protocol_start_time;
    std::shared_ptr<arrow::StringArray> sample_id;
    std::shared_ptr<arrow::UInt16Array> sample_rate;
    std::shared_ptr<arrow::StringArray> sequencing_kit;
    std::shared_ptr<arrow::StringArray> sequencer_position;
    std::shared_ptr<arrow::StringArray> sequencer_position_type;
    std::shared_ptr<arrow::StringArray> software;
    std::shared_ptr<arrow::StringArray> system_name;
    std::shared_ptr<arrow::StringArray> system_type;
    // Map column; the schema declares it as a utf8 -> utf8 map.
    std::shared_ptr<arrow::MapArray> tracking_id;

    // Table spec version associated with these columns.
    // NOTE(review): presumably the version of the table the batch was read from - confirm
    // against RunInfoTableRecordBatch::columns().
    TableSpecVersion table_version;
};

/// A single record batch of the run info table, paired with the schema description
/// needed to locate its fields.
///
/// Move-only as declared here: only move construction and move assignment are provided.
class POD5_FORMAT_EXPORT RunInfoTableRecordBatch : public TableRecordBatch {
public:
    /// \param batch           The Arrow record batch to wrap.
    /// \param field_locations Description of the run info fields for this table.
    RunInfoTableRecordBatch(
        std::shared_ptr<arrow::RecordBatch> && batch,
        std::shared_ptr<RunInfoTableSchemaDescription const> const & field_locations);
    RunInfoTableRecordBatch(RunInfoTableRecordBatch &&);
    RunInfoTableRecordBatch & operator=(RunInfoTableRecordBatch &&);

    /// \returns Typed handles to every run info column of this batch, or an error status.
    Result<RunInfoTableRecordColumns> columns() const;

private:
    std::shared_ptr<RunInfoTableSchemaDescription const> m_field_locations;
};

/// Reader for the run info table of a pod5 file.
///
/// Loaded run infos are cached both by table index and by acquisition id. The caches are
/// `mutable` so the const query methods can populate them.
class POD5_FORMAT_EXPORT RunInfoTableReader : public TableReader {
public:
    /// \param input_source    Type-erased owner of the underlying input.
    /// \param reader          Arrow IPC reader opened on the table.
    /// \param field_locations Description of the run info fields for this table.
    /// \param schema_metadata Metadata parsed from the table schema.
    /// \param pool            Memory pool for the reader.
    RunInfoTableReader(
        std::shared_ptr<void> && input_source,
        std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
        std::shared_ptr<RunInfoTableSchemaDescription const> const & field_locations,
        SchemaMetadataDescription && schema_metadata,
        arrow::MemoryPool * pool);

    RunInfoTableReader(RunInfoTableReader && other);
    RunInfoTableReader & operator=(RunInfoTableReader && other);

    /// \brief Read the record batch at index \p i.
    Result<RunInfoTableRecordBatch> read_record_batch(std::size_t i) const;

    /// \brief Find the run info with the given acquisition id.
    Result<std::shared_ptr<RunInfoData const>> find_run_info(
        std::string const & acquisition_id) const;

    /// \brief Get the run info at table row \p index.
    Result<std::shared_ptr<RunInfoData const>> get_run_info(std::size_t index) const;
    /// \brief Count the run infos stored in the table.
    Result<std::size_t> get_run_info_count() const;

private:
    /// Build a RunInfoData from row \p batch_index of \p batch and store it in both caches;
    /// \p global_index is the slot used in m_run_infos.
    Result<std::shared_ptr<RunInfoData const>> load_run_info_from_batch(
        RunInfoTableRecordBatch const & batch,
        std::size_t batch_index,
        std::size_t global_index) const;
    /// Resize m_run_infos to the table's run info count if it is currently empty.
    arrow::Status prepare_run_infos_vector() const;

    std::shared_ptr<RunInfoTableSchemaDescription const> m_field_locations;
    // NOTE(review): presumably serialises record batch reads - confirm in the .cpp.
    mutable std::mutex m_batch_get_mutex;
    // Cache of loaded run infos keyed by acquisition id.
    mutable std::unordered_map<std::string, std::shared_ptr<RunInfoData const>> m_run_info_lookup;
    // Cache of loaded run infos indexed by table row.
    mutable std::vector<std::shared_ptr<RunInfoData const>> m_run_infos;
    // NOTE(review): presumably guards the two caches above - confirm in the .cpp.
    mutable std::mutex m_run_info_lookup_mutex;
};

/// \brief Make a reader for a run info table.
/// \param sink The random access file to read the table from (named `sink` here; the
///             definition calls it `input` and opens it for reading).
/// \param pool Pool to be used for reading the table.
/// \returns The reader for the table, or an error status.
POD5_FORMAT_EXPORT Result<RunInfoTableReader> make_run_info_table_reader(
    std::shared_ptr<arrow::io::RandomAccessFile> const & sink,
    arrow::MemoryPool * pool);

}  // namespace pod5


================================================
FILE: c++/pod5_format/run_info_table_schema.cpp
================================================
#include "pod5_format/run_info_table_schema.h"

#include "pod5_format/schema_metadata.h"
#include "pod5_format/types.h"

namespace pod5 {

// Describes every field of the run info table.
//
// Each field is constructed with a pointer to this description, its column name, its
// Arrow datatype and the table version it was introduced in (v0 for all of them). The
// initialisers are listed in the same order as the Field<N, ...> members are declared.
RunInfoTableSchemaDescription::RunInfoTableSchemaDescription()
: SchemaDescriptionBase(RunInfoTableSpecVersion::latest())
// V0 Fields
, acquisition_id(this, "acquisition_id", arrow::utf8(), RunInfoTableSpecVersion::v0())
// Timestamps are stored with millisecond resolution in UTC.
, acquisition_start_time(
      this,
      "acquisition_start_time",
      arrow::timestamp(arrow::TimeUnit::MILLI, "UTC"),
      RunInfoTableSpecVersion::v0())
, adc_max(this, "adc_max", arrow::int16(), RunInfoTableSpecVersion::v0())
, adc_min(this, "adc_min", arrow::int16(), RunInfoTableSpecVersion::v0())
// String to string map.
, context_tags(
      this,
      "context_tags",
      arrow::map(arrow::utf8(), arrow::utf8()),
      RunInfoTableSpecVersion::v0())
, experiment_name(this, "experiment_name", arrow::utf8(), RunInfoTableSpecVersion::v0())
, flow_cell_id(this, "flow_cell_id", arrow::utf8(), RunInfoTableSpecVersion::v0())
, flow_cell_product_code(
      this,
      "flow_cell_product_code",
      arrow::utf8(),
      RunInfoTableSpecVersion::v0())
, protocol_name(this, "protocol_name", arrow::utf8(), RunInfoTableSpecVersion::v0())
, protocol_run_id(this, "protocol_run_id", arrow::utf8(), RunInfoTableSpecVersion::v0())
, protocol_start_time(
      this,
      "protocol_start_time",
      arrow::timestamp(arrow::TimeUnit::MILLI, "UTC"),
      RunInfoTableSpecVersion::v0())
, sample_id(this, "sample_id", arrow::utf8(), RunInfoTableSpecVersion::v0())
, sample_rate(this, "sample_rate", arrow::uint16(), RunInfoTableSpecVersion::v0())
, sequencing_kit(this, "sequencing_kit", arrow::utf8(), RunInfoTableSpecVersion::v0())
, sequencer_position(this, "sequencer_position", arrow::utf8(), RunInfoTableSpecVersion::v0())
, sequencer_position_type(
      this,
      "sequencer_position_type",
      arrow::utf8(),
      RunInfoTableSpecVersion::v0())
, software(this, "software", arrow::utf8(), RunInfoTableSpecVersion::v0())
, system_name(this, "system_name", arrow::utf8(), RunInfoTableSpecVersion::v0())
, system_type(this, "system_type", arrow::utf8(), RunInfoTableSpecVersion::v0())
// String to string map.
, tracking_id(
      this,
      "tracking_id",
      arrow::map(arrow::utf8(), arrow::utf8()),
      RunInfoTableSpecVersion::v0())
{
}

/// Map a pod5 file version onto the run info table spec version.
///
/// The file version is not consulted: the latest run info table version is returned
/// for every input.
TableSpecVersion RunInfoTableSchemaDescription::table_version_from_file_version(
    Version file_version) const
{
    (void)file_version;  // intentionally unused

    auto table_version = RunInfoTableSpecVersion::latest();
    return table_version;
}

/// Create a run info schema description and populate it from a schema read from file.
///
/// \param schema_metadata Metadata parsed from the schema's key/value pairs.
/// \param schema          The Arrow schema of the run info table.
/// \returns The populated description, or the error reported by read_schema.
Result<std::shared_ptr<RunInfoTableSchemaDescription const>> read_run_info_table_schema(
    SchemaMetadataDescription const & schema_metadata,
    std::shared_ptr<arrow::Schema> const & schema)
{
    auto description = std::make_shared<RunInfoTableSchemaDescription>();

    ARROW_RETURN_NOT_OK(
        RunInfoTableSchemaDescription::read_schema(description, schema_metadata, schema));

    return description;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/run_info_table_schema.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/schema_utils.h"
#include "pod5_format/tuple_utils.h"
#include "pod5_format/types.h"

#include <memory>
#include <tuple>
#include <vector>

namespace arrow {
class KeyValueMetadata;
class Schema;
class DataType;
class StructType;
}  // namespace arrow

namespace pod5 {

/// Names the known versions of the run info table specification.
class RunInfoTableSpecVersion {
public:
    /// The first run info table version.
    static TableSpecVersion v0()
    {
        return TableSpecVersion::first_version();
    }

    /// The newest run info table version; currently the same as v0.
    static TableSpecVersion latest()
    {
        return RunInfoTableSpecVersion::v0();
    }
};

/// Schema description of the run info table: one Field member per column.
///
/// Non-copyable. The first template argument of each Field is a numeric index that
/// counts up in declaration order.
class RunInfoTableSchemaDescription : public SchemaDescriptionBase {
public:
    RunInfoTableSchemaDescription();

    RunInfoTableSchemaDescription(RunInfoTableSchemaDescription const &) = delete;
    RunInfoTableSchemaDescription & operator=(RunInfoTableSchemaDescription const &) = delete;

    /// \returns The run info table version to use for \p file_version.
    TableSpecVersion table_version_from_file_version(Version file_version) const override;

    // V0 fields. Keep in sync with the constructor's initialiser list and FieldBuilders below.
    Field<0, arrow::StringArray> acquisition_id;
    Field<1, arrow::TimestampArray> acquisition_start_time;
    Field<2, arrow::Int16Array> adc_max;
    Field<3, arrow::Int16Array> adc_min;
    Field<4, arrow::MapArray> context_tags;
    Field<5, arrow::StringArray> experiment_name;
    Field<6, arrow::StringArray> flow_cell_id;
    Field<7, arrow::StringArray> flow_cell_product_code;
    Field<8, arrow::StringArray> protocol_name;
    Field<9, arrow::StringArray> protocol_run_id;
    Field<10, arrow::TimestampArray> protocol_start_time;
    Field<11, arrow::StringArray> sample_id;
    Field<12, arrow::UInt16Array> sample_rate;
    Field<13, arrow::StringArray> sequencing_kit;
    Field<14, arrow::StringArray> sequencer_position;
    Field<15, arrow::StringArray> sequencer_position_type;
    Field<16, arrow::StringArray> software;
    Field<17, arrow::StringArray> system_name;
    Field<18, arrow::StringArray> system_type;
    Field<19, arrow::MapArray> tracking_id;

    // Field Builders only for fields we write in newly generated files.
    // Should not include fields which are removed in the latest version:
    using FieldBuilders = FieldBuilder<
        // V0 fields
        decltype(acquisition_id),
        decltype(acquisition_start_time),
        decltype(adc_max),
        decltype(adc_min),
        decltype(context_tags),
        decltype(experiment_name),
        decltype(flow_cell_id),
        decltype(flow_cell_product_code),
        decltype(protocol_name),
        decltype(protocol_run_id),
        decltype(protocol_start_time),
        decltype(sample_id),
        decltype(sample_rate),
        decltype(sequencing_kit),
        decltype(sequencer_position),
        decltype(sequencer_position_type),
        decltype(software),
        decltype(system_name),
        decltype(system_type),
        decltype(tracking_id)>;
};

/// \brief Build a run info table schema description from a schema read from a file.
/// \param schema_metadata Metadata parsed from the schema's key/value pairs.
/// \returns The schema description, or an error status if the schema could not be read.
POD5_FORMAT_EXPORT Result<std::shared_ptr<RunInfoTableSchemaDescription const>>
read_run_info_table_schema(
    SchemaMetadataDescription const & schema_metadata,
    std::shared_ptr<arrow::Schema> const &);

}  // namespace pod5


================================================
FILE: c++/pod5_format/run_info_table_writer.cpp
================================================
#include "pod5_format/run_info_table_writer.h"

#include "pod5_format/file_output_stream.h"
#include "pod5_format/internal/tracing/tracing.h"
#include "pod5_format/read_table_utils.h"

#include <arrow/extension_type.h>
#include <arrow/ipc/writer.h>
#include <arrow/record_batch.h>
#include <arrow/type.h>
#include <arrow/util/compression.h>

namespace pod5 {

/// Construct a writer around an already opened Arrow IPC writer.
///
/// \param writer           IPC writer the record batches are written to (ownership taken).
/// \param schema           Schema of the table being written (ownership taken).
/// \param field_locations  Description of the run info fields; also used to create the
///                         column builders.
/// \param output_stream    Stream notified after each batch is written.
/// \param table_batch_size Number of rows buffered before a batch is written.
/// \param pool             Memory pool used by the column builders.
RunInfoTableWriter::RunInfoTableWriter(
    std::shared_ptr<arrow::ipc::RecordBatchWriter> && writer,
    std::shared_ptr<arrow::Schema> && schema,
    std::shared_ptr<RunInfoTableSchemaDescription> const & field_locations,
    std::shared_ptr<FileOutputStream> const & output_stream,
    std::size_t table_batch_size,
    arrow::MemoryPool * pool)
// `schema` is an rvalue reference: move it like `writer` rather than copying the pointer.
: m_schema(std::move(schema))
, m_field_locations(field_locations)
, m_output_stream{output_stream}
, m_table_batch_size(table_batch_size)
, m_writer(std::move(writer))
// Members are initialised in declaration order, so m_field_locations is valid here.
, m_field_builders(m_field_locations, pool)
{
}

// Move operations are defaulted (member-wise move); copying is deleted in the header.
RunInfoTableWriter::RunInfoTableWriter(RunInfoTableWriter && other) = default;
RunInfoTableWriter & RunInfoTableWriter::operator=(RunInfoTableWriter &&) = default;

/// Closes the writer if it is still open. Any error from closing is discarded because a
/// destructor has no way to report it; call close() explicitly to observe failures.
RunInfoTableWriter::~RunInfoTableWriter()
{
    if (!m_writer) {
        return;
    }

    static_cast<void>(close());
}

/// Append one run info row to the batch currently being built.
///
/// Builder space is reserved when a new batch starts, and the batch is written out once
/// it holds m_table_batch_size rows.
///
/// \param run_info_data The run info to add.
/// \returns The table-wide row index of the added run info, or an error status
///          ("Writer terminated" when the writer has already been closed).
Result<std::size_t> RunInfoTableWriter::add_run_info(RunInfoData const & run_info_data)
{
    POD5_TRACE_FUNCTION();
    if (!m_writer) {
        return Status::IOError("Writer terminated");
    }

    ARROW_RETURN_NOT_OK(reserve_rows());

    // Rows already flushed in earlier batches plus rows pending in this one.
    std::size_t const inserted_row = m_written_batched_row_count + m_current_batch_row_count;

    auto const & info = run_info_data;
    ARROW_RETURN_NOT_OK(m_field_builders.append(
        // V0 Fields
        info.acquisition_id,
        info.acquisition_start_time,
        info.adc_max,
        info.adc_min,
        info.context_tags,
        info.experiment_name,
        info.flow_cell_id,
        info.flow_cell_product_code,
        info.protocol_name,
        info.protocol_run_id,
        info.protocol_start_time,
        info.sample_id,
        info.sample_rate,
        info.sequencing_kit,
        info.sequencer_position,
        info.sequencer_position_type,
        info.software,
        info.system_name,
        info.system_type,
        info.tracking_id));

    m_current_batch_row_count += 1;

    bool const batch_full = m_current_batch_row_count >= m_table_batch_size;
    if (batch_full) {
        ARROW_RETURN_NOT_OK(write_batch());
    }

    return inserted_row;
}

/// Flush any buffered rows and close the underlying IPC writer.
///
/// Closing an already closed writer is a no-op that returns OK. If flushing or closing
/// fails the writer pointer is kept, so a later call will try again.
Status RunInfoTableWriter::close()
{
    bool const already_closed = !m_writer;
    if (already_closed) {
        return Status::OK();
    }

    // Write out the partially filled batch before the IPC footer is written.
    ARROW_RETURN_NOT_OK(write_batch());
    ARROW_RETURN_NOT_OK(m_writer->Close());

    m_writer.reset();
    return Status::OK();
}

// Write a caller-supplied record batch straight to the IPC writer, then notify the output
// stream that a batch has been completed. The internal row counters are not touched and
// m_writer is dereferenced without a null check, so the writer must still be open.
Status RunInfoTableWriter::write_batch(arrow::RecordBatch const & record_batch)
{
    ARROW_RETURN_NOT_OK(m_writer->WriteRecordBatch(record_batch));
    return m_output_stream->batch_complete();
}

/// Turn the rows buffered in the column builders into a record batch and write it.
///
/// Returns OK without doing anything when no rows are pending (even if the writer has
/// been closed). The row counters are updated before the batch is handed to the IPC
/// writer, so they advance even if that write fails.
Status RunInfoTableWriter::write_batch()
{
    POD5_TRACE_FUNCTION();

    auto const pending_rows = m_current_batch_row_count;
    if (pending_rows == 0) {
        return Status::OK();
    }

    if (!m_writer) {
        return Status::IOError("Writer terminated");
    }

    ARROW_ASSIGN_OR_RAISE(auto finished_columns, m_field_builders.finish_columns());

    auto const batch =
        arrow::RecordBatch::Make(m_schema, pending_rows, std::move(finished_columns));

    // The builders are now empty: account for the rows and start a fresh batch.
    m_written_batched_row_count += pending_rows;
    m_current_batch_row_count = 0;

    ARROW_RETURN_NOT_OK(m_writer->WriteRecordBatch(*batch));
    return m_output_stream->batch_complete();
}

/// Reserve builder capacity for one full batch of rows.
///
/// Only acts when the current batch is empty; once rows have been appended the
/// reservation made at the start of the batch is assumed to still be in place.
Status RunInfoTableWriter::reserve_rows()
{
    bool const batch_in_progress = m_current_batch_row_count > 0;
    if (!batch_in_progress) {
        return m_field_builders.reserve(m_table_batch_size);
    }

    return arrow::Status::OK();
}

/// Create a writer for a new run info table.
///
/// \param sink             Output stream the table is written to.
/// \param metadata         Key/value metadata applied to the schema and passed to the
///                         IPC file writer.
/// \param table_batch_size Number of rows per written record batch.
/// \param pool             Memory pool used for IPC writing and for the column builders.
/// \returns The writer, or the error reported while creating the IPC file writer.
Result<RunInfoTableWriter> make_run_info_table_writer(
    std::shared_ptr<FileOutputStream> const & sink,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    std::size_t table_batch_size,
    arrow::MemoryPool * pool)
{
    auto const description = std::make_shared<RunInfoTableSchemaDescription>();
    auto writer_schema = description->make_writer_schema(metadata);

    arrow::ipc::IpcWriteOptions write_options;
    write_options.memory_pool = pool;

    ARROW_ASSIGN_OR_RAISE(
        auto ipc_writer, arrow::ipc::MakeFileWriter(sink, writer_schema, write_options, metadata));

    return RunInfoTableWriter(
        std::move(ipc_writer),
        std::move(writer_schema),
        description,
        sink,
        table_batch_size,
        pool);
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/run_info_table_writer.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/run_info_table_schema.h"
#include "pod5_format/schema_field_builder.h"

#include <arrow/array/builder_dict.h>
#include <arrow/io/type_fwd.h>

namespace arrow {
class Schema;

namespace ipc {
class RecordBatchWriter;
}
}  // namespace arrow

namespace pod5 {

class FileOutputStream;
class RunInfoData;

/// \brief Writer for the run info table of a pod5 file.
///
/// Rows are buffered in per-column builders and written as a record batch once
/// `table_batch_size` rows have been added, or when the writer is closed. Move-only.
class POD5_FORMAT_EXPORT RunInfoTableWriter {
public:
    /// \param writer           IPC writer record batches are written to.
    /// \param schema           Schema of the table being written.
    /// \param field_locations  Description of the run info fields.
    /// \param output_stream    Stream notified each time a batch has been written.
    /// \param table_batch_size Number of rows per written batch.
    /// \param pool             Pool used by the column builders.
    RunInfoTableWriter(
        std::shared_ptr<arrow::ipc::RecordBatchWriter> && writer,
        std::shared_ptr<arrow::Schema> && schema,
        std::shared_ptr<RunInfoTableSchemaDescription> const & field_locations,
        std::shared_ptr<FileOutputStream> const & output_stream,
        std::size_t table_batch_size,
        arrow::MemoryPool * pool);
    RunInfoTableWriter(RunInfoTableWriter &&);
    RunInfoTableWriter & operator=(RunInfoTableWriter &&);
    RunInfoTableWriter(RunInfoTableWriter const &) = delete;
    RunInfoTableWriter & operator=(RunInfoTableWriter const &) = delete;
    /// Closes the writer if it is still open; errors from closing are ignored.
    ~RunInfoTableWriter();

    /// \brief Add a run info to the table, adding to the current batch.
    /// \param run_info_data The run info data to add.
    /// \returns The row index of the inserted run info, or a status on failure.
    Result<std::size_t> add_run_info(RunInfoData const & run_info_data);

    /// \brief Close this writer, signaling no further data will be written to the writer.
    ///        Buffered rows are written first; closing twice is harmless.
    Status close();

    /// \brief Reserve space for a full batch of rows. Called automatically by add_run_info;
    ///        does nothing once the current batch already contains rows.
    Status reserve_rows();

    /// \brief Find the schema for the table
    std::shared_ptr<arrow::Schema> const & schema() const { return m_schema; }

    /// \brief Flush passed data into the writer as a record batch.
    Status write_batch(arrow::RecordBatch const &);

private:
    /// \brief Flush buffered data into the writer as a record batch.
    Status write_batch();

    std::shared_ptr<arrow::Schema> m_schema;
    std::shared_ptr<RunInfoTableSchemaDescription> m_field_locations;
    std::shared_ptr<FileOutputStream> m_output_stream;
    // Number of rows that triggers a batch write.
    std::size_t m_table_batch_size;

    // Null once the writer has been closed.
    std::shared_ptr<arrow::ipc::RecordBatchWriter> m_writer;

    // Declared after m_field_locations because it is constructed from it.
    RunInfoTableSchemaDescription::FieldBuilders m_field_builders;

    // Rows accounted for in batches already flushed from the builders.
    std::size_t m_written_batched_row_count = 0;
    // Rows appended to the builders but not yet flushed.
    std::size_t m_current_batch_row_count = 0;
};

/// \brief Make a new writer for a run info table.
/// \param sink Sink to be used for output of the table.
/// \param metadata Metadata to be applied to the table schema.
/// \param table_batch_size The size of each batch written for the table.
/// \param pool Pool to be used for building table in memory.
/// \returns The writer for the new table.
POD5_FORMAT_EXPORT Result<RunInfoTableWriter> make_run_info_table_writer(
    std::shared_ptr<FileOutputStream> const & sink,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    std::size_t table_batch_size,
    arrow::MemoryPool * pool);

}  // namespace pod5


================================================
FILE: c++/pod5_format/schema_field_builder.h
================================================
#pragma once

#include "pod5_format/dictionary_writer.h"
#include "pod5_format/read_table_schema.h"

#include <arrow/array/builder_binary.h>
#include <arrow/array/builder_nested.h>
#include <arrow/array/builder_primitive.h>

namespace pod5 {

class DictionaryWriter;

namespace detail {
template <typename ArrayType>
class BuilderHelper;
template <typename ArrayType, typename ElementArrayType>
class ListBuilderHelper;

/// Builder for UUID columns: a fixed size binary builder created from the storage type
/// of the UUID extension type.
template <>
class BuilderHelper<UuidArray> : public arrow::FixedSizeBinaryBuilder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const & uuid_type, arrow::MemoryPool * pool)
    : arrow::FixedSizeBinaryBuilder(find_storage_type(uuid_type), pool)
    {
        // A UUID is 16 bytes wide.
        assert(byte_width() == 16);
    }

    /// Unwrap the extension type to the type it is physically stored as.
    static std::shared_ptr<arrow::DataType> find_storage_type(
        std::shared_ptr<arrow::DataType> const & uuid_type)
    {
        assert(uuid_type->id() == arrow::Type::EXTENSION);
        auto const * extension = static_cast<arrow::ExtensionType const *>(uuid_type.get());
        return extension->storage_type();
    }

    /// Append a UUID by forwarding its raw bytes to the base class builder.
    arrow::Status Append(Uuid const & uuid)
    {
        return arrow::FixedSizeBinaryBuilder::Append(uuid.data());
    }
};

// The specialisations below adapt the plain Arrow builders to the common
// (datatype, pool) constructor shape used by FieldBuilder. Except for the timestamp
// helper, the datatype argument is ignored because the builder type already fixes it.

// Builder for float columns.
template <>
class BuilderHelper<arrow::FloatArray> : public arrow::FloatBuilder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::FloatBuilder(pool)
    {
    }
};

// Builder for uint8 columns.
template <>
class BuilderHelper<arrow::UInt8Array> : public arrow::UInt8Builder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::UInt8Builder(pool)
    {
    }
};

// Builder for uint16 columns.
template <>
class BuilderHelper<arrow::UInt16Array> : public arrow::UInt16Builder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::UInt16Builder(pool)
    {
    }
};

// Builder for int16 columns.
template <>
class BuilderHelper<arrow::Int16Array> : public arrow::Int16Builder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::Int16Builder(pool)
    {
    }
};

// Builder for uint32 columns.
template <>
class BuilderHelper<arrow::UInt32Array> : public arrow::UInt32Builder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::UInt32Builder(pool)
    {
    }
};

// Builder for uint64 columns.
template <>
class BuilderHelper<arrow::UInt64Array> : public arrow::UInt64Builder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::UInt64Builder(pool)
    {
    }
};

// Builder for boolean columns.
template <>
class BuilderHelper<arrow::BooleanArray> : public arrow::BooleanBuilder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::BooleanBuilder(pool)
    {
    }
};

// Builder for timestamp columns. Unlike the other primitive helpers, the datatype is
// forwarded to the Arrow builder.
template <>
class BuilderHelper<arrow::NumericArray<arrow::TimestampType>> : public arrow::TimestampBuilder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const & type, arrow::MemoryPool * pool)
    : arrow::TimestampBuilder(type, pool)
    {
    }
};

// Builder for utf8 string columns.
template <>
class BuilderHelper<arrow::StringArray> : public arrow::StringBuilder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::StringBuilder(pool)
    {
    }
};

/// Builder for string -> string map columns.
///
/// Wraps an arrow::MapBuilder together with the key and item string builders it writes
/// through. The datatype argument is ignored.
template <>
class BuilderHelper<arrow::MapArray> {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : m_key_builder(std::make_shared<arrow::StringBuilder>(pool))
    , m_item_builder(std::make_shared<arrow::StringBuilder>(pool))
    , m_map_builder(pool, m_key_builder, m_item_builder)
    {
    }

    /// Finish the map array being built and store it in \p dest.
    arrow::Status Finish(std::shared_ptr<arrow::Array> * dest)
    {
        return m_map_builder.Finish(dest);
    }

    /// Reserve capacity for \p rows map slots (key/item capacity is not reserved).
    arrow::Status Reserve(std::size_t rows)
    {
        return m_map_builder.Reserve(rows);
    }

    /// Append one map value consisting of the given key/value pairs, in order.
    arrow::Status Append(std::vector<std::pair<std::string, std::string>> const & items)
    {
        // Open a new map slot, then fill it one entry at a time.
        ARROW_RETURN_NOT_OK(m_map_builder.Append());
        for (auto const & entry : items) {
            auto const & key = entry.first;
            auto const & value = entry.second;
            ARROW_RETURN_NOT_OK(m_key_builder->Append(key));
            ARROW_RETURN_NOT_OK(m_item_builder->Append(value));
        }
        return arrow::Status::OK();
    }

private:
    // Declared before m_map_builder, which is constructed from them.
    std::shared_ptr<arrow::StringBuilder> m_key_builder;
    std::shared_ptr<arrow::StringBuilder> m_item_builder;
    arrow::MapBuilder m_map_builder;
};

/// Builder for dictionary columns.
///
/// Only the int16 dictionary indices are built here; the dictionary values come from a
/// DictionaryWriter that must be supplied with set_dict_writer() before Finish() is called.
template <>
class BuilderHelper<arrow::DictionaryArray> : public arrow::Int16Builder {
public:
    BuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : arrow::Int16Builder(pool)
    {
    }

    /// Set the writer that provides the dictionary values for this column.
    void set_dict_writer(std::shared_ptr<DictionaryWriter> const & writer)
    {
        m_dict_writer = writer;
    }

    /// Finish the index array and combine it with the dictionary into \p dest.
    ///
    /// \returns Invalid if no dictionary writer has been set, otherwise the status of
    ///          finishing the indices and building the dictionary array.
    arrow::Status Finish(std::shared_ptr<arrow::Array> * dest)
    {
        // Report a missing writer as an error instead of dereferencing a null pointer.
        // Checked first so the buffered indices are left untouched on failure.
        if (!m_dict_writer) {
            return arrow::Status::Invalid("No dictionary writer set for dictionary field builder");
        }

        // Call Finish on the base class builder; the derived overload hides it.
        arrow::Int16Builder * index_builder = this;
        ARROW_ASSIGN_OR_RAISE(auto indices, index_builder->Finish());
        ARROW_ASSIGN_OR_RAISE(*dest, m_dict_writer->build_dictionary_array(indices));
        return arrow::Status::OK();
    }

private:
    std::shared_ptr<DictionaryWriter> m_dict_writer;
};

// Builder for list columns whose elements are built by BuilderHelper<ElementArrayType>.
//
// The element builder is shared with the arrow::ListBuilder, so values appended to it
// become the contents of the list slot most recently opened on the list builder.
template <typename ElementArrayType>
class ListBuilderHelper<arrow::ListArray, ElementArrayType> {
public:
    // The list datatype argument is ignored. The element helper is constructed with a null
    // datatype, which only suits element helpers that ignore their datatype argument.
    ListBuilderHelper(std::shared_ptr<arrow::DataType> const &, arrow::MemoryPool * pool)
    : m_array_builder(std::make_shared<BuilderHelper<ElementArrayType>>(nullptr, pool))
    , m_builder(std::make_unique<arrow::ListBuilder>(pool, m_array_builder))
    {
    }

    // Reserve `rows` slots in both the list builder and the element builder.
    arrow::Status Reserve(std::size_t rows)
    {
        ARROW_RETURN_NOT_OK(m_builder->Reserve(rows));
        return m_array_builder->Reserve(rows);
    }

    // Finish the list array being built and store it in `dest`.
    arrow::Status Finish(std::shared_ptr<arrow::Array> * dest) { return m_builder->Finish(dest); }

    // Append one list value holding the elements of `items`, which must provide
    // data() and size().
    template <typename Items>
    arrow::Status Append(Items const & items)
    {
        ARROW_RETURN_NOT_OK(m_builder->Append());  // start new slot
        return m_array_builder->AppendValues(items.data(), items.size());
    }

private:
    // Declared before m_builder, which is constructed from it.
    std::shared_ptr<BuilderHelper<ElementArrayType>> m_array_builder;
    std::unique_ptr<arrow::ListBuilder> m_builder;
};

}  // namespace detail

/// Owns one Arrow array builder per schema field in \p Args and drives them together.
///
/// Each type in \p Args must expose a `BuilderType` and a `WriteIndex`; the builders are
/// stored in a tuple in the order the fields are listed.
template <typename... Args>
class FieldBuilder {
public:
    using BuilderTuple = std::tuple<typename Args::BuilderType...>;

    /// Construct every builder from the datatype recorded for its field in \p desc_base.
    template <typename SchemaDescription>
    FieldBuilder(std::shared_ptr<SchemaDescription> const & desc_base, arrow::MemoryPool * pool)
    : m_builders(
          typename Args::BuilderType(
              desc_base->fields()[Args::WriteIndex::value]->datatype(),
              pool)...)
    {
    }

    /// Access the builder belonging to a field, selected by the field's write index.
    template <typename FieldType>
    std::tuple_element_t<FieldType::WriteIndex::value, BuilderTuple> & get_builder(FieldType)
    {
        constexpr auto builder_slot = FieldType::WriteIndex::value;
        return std::get<builder_slot>(m_builders);
    }

    /// Finish every builder, in field order.
    ///
    /// \returns One array per field, or the first failure (later builders are then left
    ///          unfinished).
    arrow::Result<std::vector<std::shared_ptr<arrow::Array>>> finish_columns()
    {
        std::vector<std::shared_ptr<arrow::Array>> finished(std::tuple_size<BuilderTuple>::value);
        arrow::Status status;

        detail::for_each_in_tuple(m_builders, [&](auto & builder, std::size_t column) {
            if (!status.ok()) {
                return;  // an earlier builder failed, skip the rest
            }
            status = builder.Finish(&finished[column]);
            assert(finished[column] || !status.ok());
        });

        if (status.ok()) {
            return finished;
        }
        return status;
    }

    /// Reserve capacity for \p row_count rows in every builder, stopping at the first failure.
    arrow::Status reserve(std::size_t row_count)
    {
        arrow::Status status;
        detail::for_each_in_tuple(m_builders, [&](auto & builder, std::size_t) {
            if (!status.ok()) {
                return;
            }
            status = builder.Reserve(row_count);
        });
        return status;
    }

    /// Append one row: the n-th argument is appended to the n-th builder. Stops at the
    /// first failure, leaving the remaining builders without a value for the row.
    template <typename... AppendArgs>
    arrow::Status append(AppendArgs const &... args)
    {
        auto row_values = std::forward_as_tuple(args...);

        arrow::Status status;
        for_each_in_tuple_zipped(
            m_builders, row_values, [&](auto & builder, auto & value, std::size_t) {
                if (!status.ok()) {
                    return;
                }
                status = builder.Append(value);
            });
        return status;
    }

private:
    BuilderTuple m_builders;
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/schema_metadata.cpp
================================================
#include "pod5_format/schema_metadata.h"

#include "pod5_format/uuid.h"
#include "pod5_format/version.h"

#include <arrow/util/key_value_metadata.h>

namespace pod5 {

/// \brief Parse a "major.minor.revision" version string.
///
/// \param ver Version text; it must consist of exactly three '.'-separated integers.
/// \returns The parsed Version, or Status::Invalid when the number of components is
///          wrong, a component is not a whole number, or a component does not fit in a
///          std::uint16_t.
Result<Version> parse_version_number(std::string const & ver)
{
    constexpr std::size_t component_count = 3;
    std::uint16_t components[component_count];
    std::size_t component_index = 0;
    std::size_t last_char_index = 0;
    std::size_t char_index = 0;

    // Parses ver[begin_index, end_index) as one component; throws on malformed input.
    auto parse_component = [&](std::size_t begin_index,
                               std::size_t end_index) -> std::uint16_t {
        auto const component_str = std::string(ver.data() + begin_index, ver.data() + end_index);

        std::size_t pos = 0;
        int const val = std::stoi(component_str, &pos);

        // std::stoi stops at the first non-numeric character; require it to consume everything.
        if (pos != (end_index - begin_index)) {
            throw std::runtime_error("Invalid remaining characters after version number");
        }

        // Components are stored as 16 bit unsigned values: reject anything that would
        // otherwise wrap silently (negative numbers or values above 65535).
        if (val < 0 || val > 0xFFFF) {
            throw std::runtime_error("Version component out of range");
        }

        return static_cast<std::uint16_t>(val);
    };

    try {
        while (char_index < ver.size()) {
            if (ver[char_index] == '.') {
                // Only the first two components are terminated by a '.'; a further
                // separator would index past the end of `components`.
                if (component_index >= component_count - 1) {
                    return Status::Invalid("Invalid component count");
                }
                components[component_index] = parse_component(last_char_index, char_index);

                last_char_index = char_index + 1;
                component_index += 1;
            }
            char_index += 1;
        }

        // extract the final component
        if (component_index != component_count - 1) {
            return Status::Invalid("Invalid component count");
        }
        components[component_count - 1] = parse_component(last_char_index, char_index);
    } catch (std::exception const & e) {
        // std::stoi reports malformed or oversized numbers via exceptions.
        return Status::Invalid(e.what());
    }

    return Version{components[0], components[1], components[2]};
}

/// \returns The pod5 version this library was built as, assembled from the
///          Pod5MajorVersion / Pod5MinorVersion / Pod5RevVersion constants.
Version current_build_version_number()
{
    Version build_version(Pod5MajorVersion, Pod5MinorVersion, Pod5RevVersion);
    return build_version;
}

/// Convert schema metadata into the Arrow key/value form stored on table schemas.
///
/// \param schema_metadata Metadata to serialise; every member must be set to a
///                        non-default value.
/// \returns Key/value metadata with the "MINKNOW:file_identifier", "MINKNOW:software" and
///          "MINKNOW:pod5_version" keys, or Status::Invalid naming the first unset member.
Result<std::shared_ptr<arrow::KeyValueMetadata const>> make_schema_key_value_metadata(
    SchemaMetadataDescription const & schema_metadata)
{
    auto const & software = schema_metadata.writing_software;
    auto const & pod5_version = schema_metadata.writing_pod5_version;
    auto const & identifier = schema_metadata.file_identifier;

    if (software.empty()) {
        return Status::Invalid("Expected writing_software to be specified for metadata");
    }

    // A default constructed value means the caller never filled the member in.
    if (pod5_version == Version{}) {
        return Status::Invalid("Expected writing_pod5_version to be specified for metadata");
    }

    if (identifier == Uuid{}) {
        return Status::Invalid("Expected file_identifier to be specified for metadata");
    }

    return arrow::KeyValueMetadata::Make(
        {"MINKNOW:file_identifier", "MINKNOW:software", "MINKNOW:pod5_version"},
        {to_string(identifier), software, pod5_version.to_string()});
}

/// Extract the pod5 schema metadata from Arrow key/value metadata.
///
/// \param key_value_metadata Metadata read from a table schema; dereferenced without a
///                           null check, so it must not be null.
/// \returns The parsed metadata, or an error when a key is missing, the version string
///          cannot be parsed, or the file identifier is not a valid UUID.
Result<SchemaMetadataDescription> read_schema_key_value_metadata(
    std::shared_ptr<arrow::KeyValueMetadata const> const & key_value_metadata)
{
    ARROW_ASSIGN_OR_RAISE(
        auto identifier_text, key_value_metadata->Get("MINKNOW:file_identifier"));
    ARROW_ASSIGN_OR_RAISE(auto software_text, key_value_metadata->Get("MINKNOW:software"));
    ARROW_ASSIGN_OR_RAISE(auto version_text, key_value_metadata->Get("MINKNOW:pod5_version"));
    ARROW_ASSIGN_OR_RAISE(auto parsed_version, parse_version_number(version_text));

    auto const parsed_identifier = Uuid::from_string(identifier_text);
    if (parsed_identifier) {
        return SchemaMetadataDescription{*parsed_identifier, software_text, parsed_version};
    }

    return Status::IOError(
        "Schema file_identifier metadata not uuid form: '", identifier_text, "'");
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/schema_metadata.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/uuid.h"

#include <memory>
#include <string>
#include <tuple>

namespace arrow {
class KeyValueMetadata;
}

namespace pod5 {

/// Three-part version number (major, minor, revision).
///
/// Comparisons are lexicographic over (major, minor, revision) and the textual
/// form produced by to_string() is "major.minor.revision".
class Version {
public:
    /// Construct version 0.0.0.
    Version() : Version(0, 0, 0) {}

    /// Construct a version from its three components.
    Version(std::uint16_t major, std::uint16_t minor, std::uint16_t revision)
    : m_version(major, minor, revision)
    {
    }

    bool operator<(Version const & in) const { return m_version < in.m_version; }

    bool operator>(Version const & in) const { return in.m_version < m_version; }

    bool operator==(Version const & in) const { return m_version == in.m_version; }

    bool operator!=(Version const & in) const { return !(m_version == in.m_version); }

    /// \returns The version formatted as "major.minor.revision".
    std::string to_string() const
    {
        std::string text = std::to_string(major_version());
        text += ".";
        text += std::to_string(minor_version());
        text += ".";
        text += std::to_string(revision_version());
        return text;
    }

    std::uint16_t major_version() const { return std::get<0>(m_version); }

    std::uint16_t minor_version() const { return std::get<1>(m_version); }

    std::uint16_t revision_version() const { return std::get<2>(m_version); }

private:
    // Stored as a tuple so the comparison operators get lexicographic ordering for free.
    std::tuple<std::uint16_t, std::uint16_t, std::uint16_t> m_version;
};

/// \brief Parse a Version from the text \p ver.
/// NOTE(review): the accepted format is defined by the implementation (not visible here);
/// presumably the "major.minor.revision" form produced by Version::to_string() - confirm.
POD5_FORMAT_EXPORT Result<Version> parse_version_number(std::string const & ver);
/// \brief Version number associated with the current build.
/// NOTE(review): inferred from the name; confirm against the implementation.
POD5_FORMAT_EXPORT Version current_build_version_number();

/// Metadata attached to a table schema as key/value pairs.
struct SchemaMetadataDescription {
    /// Identifier of the file; stored under the "MINKNOW:file_identifier" key.
    Uuid file_identifier;
    /// Name of the software that wrote the file; stored under the "MINKNOW:software" key.
    std::string writing_software;
    /// Version recorded by the writer; stored under the "MINKNOW:pod5_version" key.
    Version writing_pod5_version;
};

/// \brief Build the arrow key/value metadata for \p schema_metadata.
/// \returns Metadata holding the file identifier, writing software and pod5 version, or an
///          Invalid status if the software name is empty or the version / identifier is
///          default-constructed.
POD5_FORMAT_EXPORT Result<std::shared_ptr<arrow::KeyValueMetadata const>>
make_schema_key_value_metadata(SchemaMetadataDescription const & schema_metadata);

/// \brief Read a SchemaMetadataDescription back out of arrow key/value metadata.
/// \returns The parsed description, or an error if an entry cannot be fetched or parsed.
POD5_FORMAT_EXPORT Result<SchemaMetadataDescription> read_schema_key_value_metadata(
    std::shared_ptr<arrow::KeyValueMetadata const> const & key_value_metadata);

}  // namespace pod5


================================================
FILE: c++/pod5_format/schema_utils.cpp
================================================
#include "pod5_format/schema_utils.h"

namespace pod5 {

/// \brief Build the arrow schema used when writing a table.
///
/// Only fields whose removal version is later than the latest table version are included,
/// i.e. fields that have not been removed as of the current build.
/// \param metadata Metadata to be applied to the schema.
/// \returns The schema containing the fields to be written.
std::shared_ptr<arrow::Schema> SchemaDescriptionBase::make_writer_schema(
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata) const
{
    arrow::FieldVector schema_fields;
    auto const newest_version = latest_table_version();

    for (auto const * description : fields()) {
        bool const still_written = description->removed_table_spec_version() > newest_version;
        if (!still_written) {
            continue;
        }
        schema_fields.push_back(arrow::field(description->name(), description->datatype()));
    }

    return arrow::schema(schema_fields, metadata);
}

/// \brief Resolve the column index of every applicable field of \p dest_schema in \p schema.
///
/// The table version is first derived from the pod5 version recorded in \p schema_metadata.
/// Fields added after, or removed at or before, that table version are left untouched.
/// \param dest_schema Schema description whose table version and field indices are updated.
/// \param schema_metadata Metadata read from the file.
/// \param schema Arrow schema read from the file.
/// \returns OK, or the error from the first field that is missing or has an unexpected type.
Status SchemaDescriptionBase::read_schema(
    std::shared_ptr<SchemaDescriptionBase> dest_schema,
    SchemaMetadataDescription const & schema_metadata,
    std::shared_ptr<arrow::Schema> const & schema)
{
    dest_schema->m_table_spec_version =
        dest_schema->table_version_from_file_version(schema_metadata.writing_pod5_version);
    auto const file_table_version = dest_schema->table_version();

    for (auto * field : dest_schema->fields()) {
        bool const present_in_file =
            file_table_version >= field->added_table_spec_version()
            && file_table_version < field->removed_table_spec_version();
        if (!present_in_file) {
            continue;
        }

        char const * const field_name = field->name().c_str();
        auto const & expected_type = field->datatype();
        int located_index = 0;

        if (expected_type->id() != arrow::Type::DICTIONARY) {
            // Plain column: the type must match exactly.
            ARROW_ASSIGN_OR_RAISE(located_index, find_field(schema, field_name, expected_type));
        } else {
            // Dictionary column: int16 indices with either struct or string values.
            auto const & dictionary = static_cast<arrow::DictionaryType const &>(*expected_type);
            bool const has_struct_values = dictionary.value_type()->id() == arrow::Type::STRUCT;
            if (has_struct_values) {
                std::shared_ptr<arrow::StructType> found_value_type;
                ARROW_ASSIGN_OR_RAISE(
                    located_index,
                    find_dict_field(schema, field_name, arrow::int16(), &found_value_type));
            } else {
                std::shared_ptr<arrow::StringType> found_value_type;
                ARROW_ASSIGN_OR_RAISE(
                    located_index,
                    find_dict_field(schema, field_name, arrow::int16(), &found_value_type));
            }
        }

        field->set_field_index(located_index);
    }

    return arrow::Status::OK();
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/schema_utils.h
================================================
#pragma once

#include "pod5_format/schema_metadata.h"

#include <arrow/record_batch.h>
#include <arrow/type.h>

namespace pod5 {

/// \brief Look up the index of the field called \p name without checking its type.
/// \returns The field index, or a TypeError if the schema reports index -1 for the name.
inline arrow::Result<int> find_field_untyped(
    std::shared_ptr<arrow::Schema> const & schema,
    char const * name)
{
    int const index = schema->GetFieldIndex(name);
    if (index != -1) {
        return index;
    }

    return Status::TypeError("Schema missing field '", name, "'");
}

/// \brief Look up the index of the field called \p name and verify its data type.
/// \param expected_data_type Type the field must be equal to.
/// \returns The field index, or a TypeError if the field is missing or has a different type.
inline arrow::Result<int> find_field(
    std::shared_ptr<arrow::Schema> const & schema,
    char const * name,
    std::shared_ptr<arrow::DataType> const & expected_data_type)
{
    ARROW_ASSIGN_OR_RAISE(auto index, find_field_untyped(schema, name));

    auto const actual_type = schema->field(index)->type();
    if (actual_type->Equals(expected_data_type)) {
        return index;
    }

    return Status::TypeError(
        "Schema field '", name, "' is incorrect type: '", actual_type->name(), "'");
}

/// \brief Look up a dictionary-typed field and verify its index and value types.
/// \tparam ValueType Arrow type class the dictionary values are expected to be.
/// \param index_type Type the dictionary indices must be equal to.
/// \param[out] value_type Receives the dictionary value type cast to ValueType
///                        (left null when that cast fails).
/// \returns The field index, or a TypeError describing the first mismatch.
template <typename ValueType>
inline arrow::Result<int> find_dict_field(
    std::shared_ptr<arrow::Schema> const & schema,
    char const * name,
    std::shared_ptr<arrow::DataType> const & index_type,
    std::shared_ptr<ValueType> * value_type)
{
    ARROW_ASSIGN_OR_RAISE(auto index, find_field_untyped(schema, name));

    auto const schema_field = schema->field(index);
    auto const dictionary_type =
        std::dynamic_pointer_cast<arrow::DictionaryType>(schema_field->type());
    if (dictionary_type == nullptr) {
        return Status::TypeError(
            "Dictionary field was unexpected type: ", schema_field->type()->name());
    }

    bool const index_matches = dictionary_type->index_type()->Equals(index_type);
    if (!index_matches) {
        return Status::TypeError(
            "Schema field '", name, "' is incorrect type: '", dictionary_type->name(), "'");
    }

    // The out-parameter is written before it is checked, so a failed cast leaves it null.
    *value_type = std::dynamic_pointer_cast<ValueType>(dictionary_type->value_type());
    if (*value_type == nullptr) {
        return Status::TypeError(
            "Dictionary value was unexpected type: ", dictionary_type->value_type()->name());
    }

    return index;
}

/// \brief Fetch the column described by \p field from \p batch as its concrete array type.
///
/// The cast is unchecked (static_pointer_cast); the column at field.field_index() is
/// assumed to really be a FieldType::ArrayType.
template <typename FieldType>
std::shared_ptr<typename FieldType::ArrayType> find_column(
    std::shared_ptr<arrow::RecordBatch> const & batch,
    FieldType const & field)
{
    using ConcreteArray = typename FieldType::ArrayType;
    return std::static_pointer_cast<ConcreteArray>(batch->column(field.field_index()));
}

class FieldBase;

/// Sentinel values for a field's column index.
enum class SpecialFieldValues : int {
    /// Index used for a field that has no column (see FieldBase::found_field).
    InvalidField = -1,
};

/// Version number of a table specification, held as a small unsigned integer.
///
/// The largest representable value is used as the "unknown" version, so it compares
/// greater than or equal to every other version.
class TableSpecVersion {
public:
    using UnderlyingType = std::uint8_t;

    /// Default construction yields the unknown version.
    TableSpecVersion() : TableSpecVersion(std::numeric_limits<UnderlyingType>::max()) {}

    /// Version 0.
    static TableSpecVersion first_version() { return at_version(0); }

    /// The unknown version (same value as a default-constructed instance).
    static TableSpecVersion unknown_version() { return TableSpecVersion{}; }

    /// A specific version number.
    static TableSpecVersion at_version(UnderlyingType version) { return TableSpecVersion(version); }

    UnderlyingType as_int() const { return m_version; }

    bool operator<(TableSpecVersion const & other) const { return m_version < other.m_version; }

    bool operator>(TableSpecVersion const & other) const { return other.m_version < m_version; }

    bool operator<=(TableSpecVersion const & other) const { return !(other.m_version < m_version); }

    bool operator>=(TableSpecVersion const & other) const { return !(m_version < other.m_version); }

private:
    TableSpecVersion(UnderlyingType version) : m_version(version) {}

    UnderlyingType m_version;
};

/// Base class describing the fields of a table schema and the table version in use.
///
/// Fields register themselves through add_field() (see the FieldBase constructor); this
/// class stores raw, non-owning pointers to them.
class SchemaDescriptionBase {
public:
    /// \param version Table spec version this description initially represents.
    SchemaDescriptionBase(TableSpecVersion version) : m_table_spec_version(version) {}

    virtual ~SchemaDescriptionBase() = default;

    /// Register a field with this schema; the pointer is stored, not owned.
    void add_field(FieldBase * field) { m_fields.push_back(field); }

    /// All registered fields, in registration order.
    std::vector<FieldBase *> const & fields() { return m_fields; }

    /// Read-only view of the registered fields.
    /// NOTE(review): reinterprets vector<FieldBase *> as vector<FieldBase const *>; this
    /// relies on both vector types sharing a layout, which the standard does not guarantee.
    std::vector<FieldBase const *> const & fields() const
    {
        return reinterpret_cast<std::vector<FieldBase const *> const &>(m_fields);
    }

    /// Table version that corresponds to the version number of the current build.
    TableSpecVersion latest_table_version() const
    {
        return table_version_from_file_version(current_build_version_number());
    }

    /// Map a file (pod5) version to the table spec version used by that file.
    virtual TableSpecVersion table_version_from_file_version(Version file_version) const = 0;

    /// Table version currently held by this description (updated by read_schema).
    TableSpecVersion table_version() const { return m_table_spec_version; }

    /// \brief Make a new schema for a read table to be written (will only contain fields which are written in the latest version).
    /// \param metadata Metadata to be applied to the schema.
    /// \returns The schema for a read table.
    std::shared_ptr<arrow::Schema> make_writer_schema(
        std::shared_ptr<arrow::KeyValueMetadata const> const & metadata) const;

    /// \brief Set the table version of \p dest_schema from \p schema_metadata and resolve
    ///        the column index of each applicable field within \p schema.
    static Status read_schema(
        std::shared_ptr<SchemaDescriptionBase> dest_schema,
        SchemaMetadataDescription const & schema_metadata,
        std::shared_ptr<arrow::Schema> const & schema);

private:
    // Non-owning pointers to the fields registered via add_field().
    std::vector<FieldBase *> m_fields;
    TableSpecVersion m_table_spec_version;
};

namespace detail {
template <typename ArrayType>
class BuilderHelper;
template <typename ArrayType, typename ElementArrayType>
class ListBuilderHelper;
}  // namespace detail

/// Description of a single column of a table: its name, arrow data type, column index and
/// the table spec versions in which it was added and removed.
///
/// On construction the field registers itself with its owning schema description, which
/// keeps a raw pointer to it.
/// NOTE(review): because the owner stores `this`, a copied or relocated FieldBase is not
/// known to the owner - confirm fields are only ever held in place.
class FieldBase {
public:
    /// \param owner Schema description to register this field with.
    /// \param field_index Initial column index of the field.
    /// \param name Column name.
    /// \param datatype Arrow data type of the column.
    /// \param added_table_spec_version Table version in which the field was introduced.
    /// \param removed_table_spec_version Table version in which the field was removed
    ///        (the unknown version when it has not been removed).
    FieldBase(
        SchemaDescriptionBase * owner,
        int field_index,
        std::string name,
        std::shared_ptr<arrow::DataType> const & datatype,
        TableSpecVersion added_table_spec_version = TableSpecVersion::first_version(),
        TableSpecVersion removed_table_spec_version = TableSpecVersion::unknown_version())
    : m_name(std::move(name))  // `name` is taken by value, so move it rather than copy again.
    , m_datatype(datatype)
    , m_field_index(field_index)
    , m_added_table_spec_version(added_table_spec_version)
    , m_removed_table_spec_version(removed_table_spec_version)
    {
        owner->add_field(this);
    }

    std::string const & name() const { return m_name; }

    std::shared_ptr<arrow::DataType> const & datatype() const { return m_datatype; }

    int field_index() const { return m_field_index; }

    TableSpecVersion added_table_spec_version() const { return m_added_table_spec_version; }

    TableSpecVersion removed_table_spec_version() const { return m_removed_table_spec_version; }

    void set_field_index(int index) { m_field_index = index; }

    /// \returns true unless the field index is the InvalidField sentinel.
    bool found_field() const
    {
        return m_field_index != static_cast<int>(SpecialFieldValues::InvalidField);
    }

private:
    std::string m_name;
    std::shared_ptr<arrow::DataType> m_datatype;
    int m_field_index = static_cast<int>(SpecialFieldValues::InvalidField);
    TableSpecVersion m_added_table_spec_version;
    TableSpecVersion m_removed_table_spec_version;
};

/// Typed field description.
/// \tparam WriteIndex_ Column index passed to FieldBase as the field's initial index.
/// \tparam ArrayType_ Arrow array type of the column.
template <int WriteIndex_, typename ArrayType_>
struct Field : public FieldBase {
    using WriteIndex = std::integral_constant<int, WriteIndex_>;
    using ArrayType = ArrayType_;
    using BuilderType = detail::BuilderHelper<ArrayType>;

    /// Forwards to FieldBase, using WriteIndex as the initial field index.
    Field(
        SchemaDescriptionBase * owner,
        std::string name,
        std::shared_ptr<arrow::DataType> const & datatype,
        TableSpecVersion added_table_spec_version = TableSpecVersion::first_version(),
        TableSpecVersion removed_table_spec_version = TableSpecVersion::unknown_version())
    : FieldBase(
          owner,
          WriteIndex::value,
          std::move(name),  // by-value parameter: hand it on instead of copying it again
          datatype,
          added_table_spec_version,
          removed_table_spec_version)
    {
    }
};

/// Typed description of a list column.
/// \tparam WriteIndex_ Column index passed on to Field.
/// \tparam ArrayType_ Arrow array type of the list column.
/// \tparam ElementType_ Type used for the list elements by the list builder helper.
template <int WriteIndex_, typename ArrayType_, typename ElementType_>
struct ListField : public Field<WriteIndex_, ArrayType_> {
    using ElementType = ElementType_;
    using BuilderType = detail::ListBuilderHelper<ArrayType_, ElementType>;

    /// Forwards every argument to Field.
    ListField(
        SchemaDescriptionBase * owner,
        std::string name,
        std::shared_ptr<arrow::DataType> const & datatype,
        TableSpecVersion added_table_spec_version = TableSpecVersion::first_version(),
        TableSpecVersion removed_table_spec_version = TableSpecVersion::unknown_version())
    : Field<WriteIndex_, ArrayType_>(
          owner,
          std::move(name),  // by-value parameter: hand it on instead of copying it again
          datatype,
          added_table_spec_version,
          removed_table_spec_version)
    {
    }
};

template <typename... Args>
class FieldBuilder;

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_builder.h
================================================
#pragma once

#include "pod5_format/expandable_buffer.h"
#include "pod5_format/signal_compression.h"
#include "pod5_format/signal_table_utils.h"
#include "pod5_format/types.h"

#include <arrow/array/builder_nested.h>
#include <arrow/array/builder_primitive.h>
#include <arrow/array/util.h>

#include <variant>

namespace pod5 {

/// Builder state for a signal column stored as uncompressed 16 bit samples.
struct UncompressedSignalBuilder {
    /// Builder for the sample values; also handed to signal_builder as its value builder.
    std::shared_ptr<arrow::Int16Builder> signal_data_builder;
    /// Builder for the list column; one list slot is started per appended signal.
    std::unique_ptr<arrow::LargeListBuilder> signal_builder;
};

/// Builder state for a signal column stored as compressed (vbz) bytes.
struct VbzSignalBuilder {
    /// Start offset of each row within data_values (one entry per appended signal).
    ExpandableBuffer<std::int64_t> offset_values;
    /// Concatenated compressed bytes of every appended signal.
    ExpandableBuffer<std::uint8_t> data_values;
};

using SignalBuilderVariant = std::variant<UncompressedSignalBuilder, VbzSignalBuilder>;

/// \brief Create the builder state matching \p compression_type.
/// \param compression_type UncompressedSignal selects the list builder; any other value
///                         selects the vbz builder.
/// \param pool Memory pool used by the builders.
/// \returns The builder variant, or an error if a vbz buffer could not be initialised.
inline arrow::Result<SignalBuilderVariant> make_signal_builder(
    SignalType compression_type,
    arrow::MemoryPool * pool)
{
    if (compression_type != SignalType::UncompressedSignal) {
        VbzSignalBuilder vbz_builder;
        ARROW_RETURN_NOT_OK(vbz_builder.offset_values.init_buffer(pool));
        ARROW_RETURN_NOT_OK(vbz_builder.data_values.init_buffer(pool));
        return vbz_builder;
    }

    // The list builder shares ownership of the values builder it appends into.
    auto const values_builder = std::make_shared<arrow::Int16Builder>(pool);
    return UncompressedSignalBuilder{
        values_builder,
        std::make_unique<arrow::LargeListBuilder>(pool, values_builder),
    };
}

namespace visitors {
/// Visitor reserving space in a signal builder for a number of rows.
class reserve_rows {
public:
    /// \param row_count Number of rows to reserve for.
    /// \param approx_read_samples Estimated number of samples per row.
    reserve_rows(std::size_t row_count, std::size_t approx_read_samples)
    : m_row_count(row_count)
    , m_approx_read_samples(approx_read_samples)
    {
    }

    /// Reserve list slots for the rows, then value space for the estimated samples.
    Status operator()(UncompressedSignalBuilder & builder) const
    {
        ARROW_RETURN_NOT_OK(builder.signal_builder->Reserve(m_row_count));
        return builder.signal_data_builder->Reserve(estimated_value_count());
    }

    /// Reserve one offset per row plus one extra, then data space for the estimate.
    Status operator()(VbzSignalBuilder & builder) const
    {
        ARROW_RETURN_NOT_OK(builder.offset_values.reserve(m_row_count + 1));
        return builder.data_values.reserve(estimated_value_count());
    }

    std::size_t m_row_count;
    std::size_t m_approx_read_samples;

private:
    // Rows multiplied by the per-row sample estimate.
    std::size_t estimated_value_count() const { return m_row_count * m_approx_read_samples; }
};

/// Visitor appending one row of signal bytes that need no further compression.
class append_pre_compressed_signal {
public:
    /// \param signal Bytes to append as a single row.
    append_pre_compressed_signal(gsl::span<std::uint8_t const> const & signal) : m_signal(signal) {}

    /// Start a new list slot and append the bytes reinterpreted as 16 bit samples.
    Status operator()(UncompressedSignalBuilder & builder) const
    {
        ARROW_RETURN_NOT_OK(builder.signal_builder->Append());  // start new slot

        auto const sample_view = m_signal.as_span<std::int16_t const>();
        return builder.signal_data_builder->AppendValues(sample_view.data(), sample_view.size());
    }

    /// Record where this row starts in the data buffer, then append its bytes.
    Status operator()(VbzSignalBuilder & builder) const
    {
        auto const row_start = builder.data_values.size();
        ARROW_RETURN_NOT_OK(builder.offset_values.append(row_start));
        return builder.data_values.append_array(m_signal);
    }

    gsl::span<std::uint8_t const> m_signal;
};

/// Visitor appending one row of raw 16 bit samples, compressing them when the builder
/// stores compressed signal.
class append_signal {
public:
    /// \param signal Samples to append as a single row.
    /// \param pool Memory pool passed to the compressor.
    append_signal(gsl::span<std::int16_t const> const & signal, arrow::MemoryPool * pool)
    : m_signal(signal)
    , m_pool(pool)
    {
    }

    /// Start a new list slot and append the samples unchanged.
    Status operator()(UncompressedSignalBuilder & builder) const
    {
        ARROW_RETURN_NOT_OK(builder.signal_builder->Append());  // start new slot
        return builder.signal_data_builder->AppendValues(m_signal.data(), m_signal.size());
    }

    /// Record the row's start offset, then compress the samples into the data buffer.
    Status operator()(VbzSignalBuilder & builder) const
    {
        auto const row_start = builder.data_values.size();
        ARROW_RETURN_NOT_OK(builder.offset_values.append(row_start));

        ARROW_ASSIGN_OR_RAISE(
            auto const worst_case_size, compressed_signal_max_size(m_signal.size()));

        // The data buffer provides up to worst_case_size bytes; the callback compresses
        // into that space and reports how many bytes it produced.
        auto const compress_into =
            [this](gsl::span<std::uint8_t> buffer) -> arrow::Result<std::size_t> {
            return compress_signal(m_signal, m_pool, buffer);
        };
        return builder.data_values.append(worst_case_size, compress_into);
    }

    gsl::span<std::int16_t const> m_signal;
    arrow::MemoryPool * m_pool;
};

/// Visitor that finishes a signal builder and stores the resulting array in a destination
/// pointer.
class finish_column {
public:
    /// \param dest Location that receives the finished array.
    finish_column(std::shared_ptr<arrow::Array> * dest) : m_dest(dest) {}

    /// Finish the list builder directly into the destination.
    Status operator()(UncompressedSignalBuilder & builder) const
    {
        return builder.signal_builder->Finish(m_dest);
    }

    /// Assemble a vbz_signal() array from the accumulated offsets and data bytes.
    /// NOTE(review): relies on ExpandableBuffer semantics not visible here - presumably the
    /// copied offsets and the buffer returned by get_buffer() stay valid after clear().
    Status operator()(VbzSignalBuilder & builder) const
    {
        // Take the offsets out of the builder before resetting it.
        auto offsets_copy = builder.offset_values;
        ARROW_RETURN_NOT_OK(builder.offset_values.clear());

        // Likewise grab the data buffer before resetting the builder's data storage.
        auto const value_data = builder.data_values.get_buffer();
        ARROW_RETURN_NOT_OK(builder.data_values.clear());

        // One offset was recorded per row, so this is the row count; it must be read
        // before the terminating offset is appended below.
        auto const length = offsets_copy.size();

        // Write final offset (values length)
        ARROW_RETURN_NOT_OK(offsets_copy.append(value_data->size()));
        auto const offsets = offsets_copy.get_buffer();

        // No validity bitmap is supplied.
        std::shared_ptr<arrow::Buffer> null_bitmap;

        // Trailing arguments: null count 0 and array offset 0.
        *m_dest = arrow::MakeArray(
            arrow::ArrayData::Make(vbz_signal(), length, {null_bitmap, offsets, value_data}, 0, 0));

        return arrow::Status::OK();
    }

    std::shared_ptr<arrow::Array> * m_dest;
};

}  // namespace visitors
}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_compression.cpp
================================================
#include "pod5_format/signal_compression.h"

#include "pod5_format/svb16/decode.hpp"
#include "pod5_format/svb16/encode.hpp"

#include <arrow/buffer.h>
#include <arrow/util/io_util.h>
#include <zstd.h>

#include <cassert>
#include <limits>

namespace pod5 {

namespace {

// SVB is designed around 32 bit sizes, so that's the maximum uncompressed samples allowed.
constexpr std::size_t max_uncompressed_samples = std::numeric_limits<std::uint32_t>::max();

class DecompressContext {
    struct DCtxDeleter {
        void operator()(ZSTD_DCtx * ctx) { ZSTD_freeDCtx(ctx); }
    };

    std::unique_ptr<ZSTD_DCtx, DCtxDeleter> m_context;

public:
    DecompressContext() { m_context.reset(ZSTD_createDCtx()); }

    ZSTD_DCtx * get() { return m_context.get(); }

    explicit operator bool() const { return static_cast<bool>(m_context); }
};

}  // namespace

/// \brief Upper bound on the compressed size, in bytes, of \p sample_count samples.
/// \returns The zstd bound for the largest possible svb16 encoding, or Invalid if the
///          sample count exceeds the supported maximum or zstd reports an error.
arrow::Result<std::size_t> compressed_signal_max_size(std::size_t sample_count)
{
    bool const too_many_samples = sample_count > max_uncompressed_samples;
    if (too_many_samples) {
        return arrow::Status::Invalid(
            sample_count, " samples exceeds max of ", max_uncompressed_samples);
    }

    // Worst case svb16 output first, then the worst case of zstd applied on top of it.
    auto const svb_bound = svb16_max_encoded_length(sample_count);
    auto const zstd_bound = ZSTD_compressBound(svb_bound);
    if (!ZSTD_isError(zstd_bound)) {
        return zstd_bound;
    }

    return pod5::Status::Invalid(
        sample_count,
        " samples exceeds zstd limit: (",
        zstd_bound,
        " ",
        ZSTD_getErrorName(zstd_bound),
        ")");
}

/// \brief Compress \p samples into \p destination (svb16 with delta + zigzag, then zstd).
/// \param samples Samples to compress.
/// \param pool Memory pool used for the intermediate svb16 buffer.
/// \param destination Output space for the compressed bytes.
/// \returns Number of bytes written to \p destination, or an error if the input is too
///          large, allocation fails, or zstd reports an error.
arrow::Result<std::size_t> compress_signal(
    gsl::span<SampleType const> samples,
    arrow::MemoryPool * pool,
    gsl::span<std::uint8_t> destination)
{
    std::size_t const input_samples = samples.size();
    if (input_samples > max_uncompressed_samples) {
        return arrow::Status::Invalid(
            input_samples, " samples exceeds max of ", max_uncompressed_samples);
    }

    // Stage 1: svb16 encode into a scratch buffer sized for the worst case, then shrink
    // the buffer to the bytes actually produced.
    auto const svb_worst_case = svb16_max_encoded_length(input_samples);
    ARROW_ASSIGN_OR_RAISE(auto svb_buffer, arrow::AllocateResizableBuffer(svb_worst_case, pool));

    constexpr bool delta_encode = true;
    constexpr bool zigzag_encode = true;
    auto const svb_byte_count = svb16::encode<SampleType, delta_encode, zigzag_encode>(
        samples.data(), svb_buffer->mutable_data(), input_samples);
    ARROW_RETURN_NOT_OK(svb_buffer->Resize(svb_byte_count));

    // Stage 2: confirm zstd can bound the output for this input size.
    size_t const zstd_bound = ZSTD_compressBound(svb_buffer->size());
    if (ZSTD_isError(zstd_bound)) {
        return pod5::Status::Invalid(
            "Failed to find zstd max size for data: (",
            zstd_bound,
            " ",
            ZSTD_getErrorName(zstd_bound),
            ")");
    }

    // Stage 3: zstd compress (level 1) straight into the caller's destination.
    // A reusable compression context would help when many signals are compressed.
    size_t const written = ZSTD_compress(
        destination.data(), destination.size(), svb_buffer->data(), svb_buffer->size(), 1);
    if (!ZSTD_isError(written)) {
        return written;
    }

    return pod5::Status::Invalid(
        "Failed to compress data: (", written, " ", ZSTD_getErrorName(written), ")");
}

/// \brief Compress \p samples into a newly allocated buffer.
/// \param samples Samples to compress.
/// \param pool Memory pool used for the output and intermediate buffers.
/// \returns A buffer resized to exactly the compressed bytes, or the first error hit.
arrow::Result<std::shared_ptr<arrow::Buffer>> compress_signal(
    gsl::span<SampleType const> samples,
    arrow::MemoryPool * pool)
{
    // Allocate for the worst case, compress in place, then trim to the real size.
    ARROW_ASSIGN_OR_RAISE(
        std::size_t const worst_case_bytes, compressed_signal_max_size(samples.size()));

    ARROW_ASSIGN_OR_RAISE(
        std::shared_ptr<arrow::ResizableBuffer> out,
        arrow::AllocateResizableBuffer(worst_case_bytes, pool));

    auto const output_space = gsl::make_span(out->mutable_data(), out->size());
    ARROW_ASSIGN_OR_RAISE(auto compressed_bytes, compress_signal(samples, pool, output_space));

    ARROW_RETURN_NOT_OK(out->Resize(compressed_bytes));
    return out;
}

/// \brief Decompress \p compressed_bytes (zstd over svb16) into \p destination.
///
/// The input is treated as untrusted: its size and the size claimed by the zstd frame
/// are both checked against what \p destination.size() samples could have produced
/// before any allocation or decoding takes place.
/// \param compressed_bytes Compressed signal for a single row.
/// \param pool Memory pool used for the intermediate svb16 buffer.
/// \param destination Output samples; its size is the expected sample count.
/// \returns OK on success, Invalid for corrupt input, OutOfMemory when the claimed size
///          exceeds system memory or the zstd context could not be created.
arrow::Status decompress_signal(
    gsl::span<std::uint8_t const> compressed_bytes,
    arrow::MemoryPool * pool,
    gsl::span<std::int16_t> destination)
{
    // Check that we could have compressed this size.
    ARROW_ASSIGN_OR_RAISE(
        std::size_t const max_compressed_size, compressed_signal_max_size(destination.size()));
    if (compressed_bytes.size() > max_compressed_size) {
        return pod5::Status::Invalid(
            "Input data corrupt: compressed input size (",
            compressed_bytes.size(),
            ") exceeds max compressed output size (",
            max_compressed_size,
            ")");
    }

    // Find out how big zstd thinks the data is.
    unsigned long long const decompressed_zstd_size =
        ZSTD_getFrameContentSize(compressed_bytes.data(), compressed_bytes.size());
    if (ZSTD_isError(decompressed_zstd_size)) {
        return pod5::Status::Invalid(
            "Input data not compressed by zstd: (",
            decompressed_zstd_size,
            " ",
            ZSTD_getErrorName(decompressed_zstd_size),
            ")");
    }

    // Documentation of |ZSTD_getFrameContentSize| explicitly states that we should bounds check this:
    //     *   note 5 : If source is untrusted, decompressed size could be wrong or intentionally modified.
    //     *            Always ensure return value fits within application's authorized limits.
    //     *            Each application can set its own limits.
    std::size_t const max_svb16_compressed_size = svb16_max_encoded_length(destination.size());
    if (decompressed_zstd_size > max_svb16_compressed_size) {
        return arrow::Status::Invalid(
            "Input data corrupt: claimed size (",
            decompressed_zstd_size,
            ") exceeds max compressed output size (",
            max_svb16_compressed_size,
            ")");
    }

    // Check that we have enough memory to decompress.
    // Note: this will return 0 on unsupported platforms, so we skip it there.
    // (Deliberately no assert on the value: a 0 result is an expected outcome, and
    // asserting would abort debug builds on exactly the platforms being skipped.)
    std::int64_t const system_memory = arrow::internal::GetTotalMemoryBytes();
    if (system_memory > 0 && decompressed_zstd_size >= static_cast<std::size_t>(system_memory)) {
        return arrow::Status::OutOfMemory(
            "Not enough system memory (",
            system_memory,
            ") to decompress file (",
            decompressed_zstd_size,
            ")");
    }

    if (POD5_ENABLE_FUZZERS && decompressed_zstd_size > 1'000'000) {
        return arrow::Status::Invalid("Skipping huge sizes when fuzzing");
    }

    // One zstd context per thread, created on first use and reused afterwards.
    thread_local DecompressContext decompress_context;
    if (!decompress_context) {
        return arrow::Status::OutOfMemory("Failed to create zstd decompress context");
    }

    // Decompress the data using zstd.
    // The buffer is over-allocated by the padding the svb16 decoder asks for.
    auto const allocation_padding = svb16::decode_input_buffer_padding_byte_count();
    ARROW_ASSIGN_OR_RAISE(
        auto intermediate,
        arrow::AllocateResizableBuffer(decompressed_zstd_size + allocation_padding, pool));
    size_t const decompress_res = ZSTD_decompressDCtx(
        decompress_context.get(),
        intermediate->mutable_data(),
        intermediate->size(),
        compressed_bytes.data(),
        compressed_bytes.size());
    if (ZSTD_isError(decompress_res)) {
        return pod5::Status::Invalid(
            "Input data failed to decompress using zstd: (",
            decompress_res,
            " ",
            ZSTD_getErrorName(decompress_res),
            ")");
    }

    auto const svb16_compressed_data_with_padding =
        gsl::make_span(intermediate->data(), intermediate->size());
    auto const svb16_compressed_data_no_padding =
        svb16_compressed_data_with_padding.subspan(0, decompressed_zstd_size);

    // Validate the data.
    if (!svb16::validate(svb16_compressed_data_no_padding, destination.size())) {
        return pod5::Status::Invalid("Compressed signal data is corrupt");
    }

    // Now decompress the data using svb:
    static constexpr bool UseDelta = true;
    static constexpr bool UseZigzag = true;
    auto consumed_count = svb16::decode<SampleType, UseDelta, UseZigzag>(
        destination, svb16_compressed_data_with_padding);
    if (consumed_count != decompressed_zstd_size) {
        return pod5::Status::Invalid("Remaining data at end of signal buffer");
    }

    return pod5::Status::OK();
}

/// \brief Decompress \p compressed_bytes into a newly allocated buffer of samples.
/// \param compressed_bytes Compressed signal for a single row.
/// \param samples_count Number of samples the compressed data is expected to hold.
/// \param pool Memory pool used for the output and intermediate buffers.
/// \returns A buffer of samples_count 16 bit samples, or the first error hit.
arrow::Result<std::shared_ptr<arrow::Buffer>> decompress_signal(
    gsl::span<std::uint8_t const> compressed_bytes,
    std::uint32_t samples_count,
    arrow::MemoryPool * pool)
{
    auto const output_byte_count = samples_count * sizeof(SampleType);
    ARROW_ASSIGN_OR_RAISE(
        std::shared_ptr<arrow::ResizableBuffer> out,
        arrow::AllocateResizableBuffer(output_byte_count, pool));

    // View the freshly allocated bytes as samples and decode straight into them.
    auto output_bytes = gsl::make_span(out->mutable_data(), out->size());
    auto output_samples = output_bytes.as_span<std::int16_t>();

    ARROW_RETURN_NOT_OK(decompress_signal(compressed_bytes, pool, output_samples));
    return out;
}
}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_compression.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"

#include <gsl/gsl-lite.hpp>

namespace arrow {
class MemoryPool;
class Buffer;
}  // namespace arrow

namespace pod5 {

using SampleType = std::int16_t;

/// \brief Upper bound, in bytes, on the compressed size of \p sample_count samples.
/// \returns The bound, or an error if \p sample_count is larger than can be compressed.
POD5_FORMAT_EXPORT arrow::Result<std::size_t> compressed_signal_max_size(std::size_t sample_count);

/// \brief Compress \p samples into caller-provided space.
/// \param pool Memory pool used for intermediate storage.
/// \param destination Output space; compressed_signal_max_size() gives a sufficient size.
/// \returns The number of bytes written to \p destination.
POD5_FORMAT_EXPORT arrow::Result<std::size_t> compress_signal(
    gsl::span<SampleType const> samples,
    arrow::MemoryPool * pool,
    gsl::span<std::uint8_t> destination);

/// \brief Compress \p samples into a newly allocated buffer sized to the compressed bytes.
POD5_FORMAT_EXPORT arrow::Result<std::shared_ptr<arrow::Buffer>> compress_signal(
    gsl::span<SampleType const> samples,
    arrow::MemoryPool * pool);

/// \brief Decompress into a newly allocated buffer holding \p samples_count samples.
POD5_FORMAT_EXPORT arrow::Result<std::shared_ptr<arrow::Buffer>> decompress_signal(
    gsl::span<std::uint8_t const> compressed_bytes,
    std::uint32_t samples_count,
    arrow::MemoryPool * pool);

/// \brief Decompress into caller-provided space.
/// \param destination Output samples; its size must equal the number of samples that
///                    were compressed, as it is used to validate the input.
POD5_FORMAT_EXPORT arrow::Status decompress_signal(
    gsl::span<std::uint8_t const> compressed_bytes,
    arrow::MemoryPool * pool,
    gsl::span<std::int16_t> destination);

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_table_reader.cpp
================================================
#include "pod5_format/signal_table_reader.h"

#include "pod5_format/schema_metadata.h"
#include "pod5_format/signal_compression.h"
#include "pod5_format/table_reader.h"

#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/ipc/reader.h>

#include <iostream>

namespace pod5 {

/// Helper that evicts the least recently accessed entries from the signal batch cache.
struct SignalTableReaderCacheCleaner {
    /// \brief Remove roughly 20% (at least one) of the entries of \p cached_batches,
    ///        choosing those with the lowest last_access_index.
    /// \param cached_batches Cache keyed by batch index; an empty cache is left untouched.
    static void make_space_in_table_batches(
        std::unordered_map<std::size_t, SignalTableReader::CachedItem> & cached_batches)
    {
        // Nothing to evict; without this guard the "at least one" rule below would index
        // into an empty vector.
        if (cached_batches.empty()) {
            return;
        }

        std::vector<std::pair<std::size_t, SignalTableReader::AccessIndex>> access_ordered_data;
        access_ordered_data.reserve(cached_batches.size());

        // Iterate by reference: only the key and access index are needed, so the cached
        // items themselves must not be copied.
        for (auto const & item : cached_batches) {
            access_ordered_data.emplace_back(item.first, item.second.last_access_index);
        }
        std::sort(
            access_ordered_data.begin(),
            access_ordered_data.end(),
            [](auto const & a, auto const & b) { return a.second < b.second; });

        // Clear about 20% of the cache to make space for further growth:
        auto const to_clear = std::max<std::size_t>(1, cached_batches.size() * 0.2f);
        for (std::size_t i = 0; i < to_clear; ++i) {
            auto const index_to_remove = access_ordered_data[i].first;
            cached_batches.erase(index_to_remove);
        }
    }
};

/// \brief Wrap a record batch of the signal table.
/// \param batch The underlying arrow record batch.
/// \param field_locations Column locations and signal type used to interpret the batch.
/// \param pool Memory pool passed to the decompressor when extracting compressed signal.
SignalTableRecordBatch::SignalTableRecordBatch(
    std::shared_ptr<arrow::RecordBatch> const & batch,
    SignalTableSchemaDescription field_locations,
    arrow::MemoryPool * pool)
: TableRecordBatch(batch)
, m_field_locations(field_locations)
, m_pool(pool)
{
}

/// \returns The read id column of this batch, cast (unchecked) to a UuidArray.
std::shared_ptr<UuidArray> SignalTableRecordBatch::read_id_column() const
{
    auto const column = batch()->column(m_field_locations.read_id);
    return std::static_pointer_cast<UuidArray>(column);
}

/// \returns The signal column of this batch, cast (unchecked) to a large list array.
///          Only meaningful when the signal type is UncompressedSignal.
std::shared_ptr<arrow::LargeListArray> SignalTableRecordBatch::uncompressed_signal_column() const
{
    auto const column = batch()->column(m_field_locations.signal);
    return std::static_pointer_cast<arrow::LargeListArray>(column);
}

/// \returns The signal column of this batch, cast (unchecked) to a VbzSignalArray.
///          Only meaningful when the signal type is VbzSignal.
std::shared_ptr<VbzSignalArray> SignalTableRecordBatch::vbz_signal_column() const
{
    auto const column = batch()->column(m_field_locations.signal);
    return std::static_pointer_cast<VbzSignalArray>(column);
}

/// \returns The samples column of this batch, cast (unchecked) to a UInt32Array.
std::shared_ptr<arrow::UInt32Array> SignalTableRecordBatch::samples_column() const
{
    auto const column = batch()->column(m_field_locations.samples);
    return std::static_pointer_cast<arrow::UInt32Array>(column);
}

/// \brief Number of bytes stored for the signal of one row.
///
/// For uncompressed signal this is the sample count times the sample size; for vbz signal
/// it is the size of the compressed data.
/// \param row_index Row to query; must be less than num_rows().
/// \returns The byte count, or Invalid if the row is out of range or the signal type is
///          not recognised.
Result<std::size_t> SignalTableRecordBatch::samples_byte_count(std::size_t row_index) const
{
    // Same range check as the extract_* accessors: the arrow accessors used below do not
    // validate the index themselves.
    if (row_index >= num_rows()) {
        return pod5::Status::Invalid(
            "Queried signal row ",
            row_index,
            " is outside the available rows (",
            num_rows(),
            " in batch)");
    }

    switch (m_field_locations.signal_type) {
    case SignalType::UncompressedSignal: {
        auto signal_column = uncompressed_signal_column();
        auto signal = signal_column->value_slice(row_index);
        return signal->length() * sizeof(std::int16_t);
    }
    case SignalType::VbzSignal: {
        auto signal_column = vbz_signal_column();
        auto signal_compressed = signal_column->Value(row_index);
        return signal_compressed.size();
    }
    }

    return pod5::Status::Invalid("Unknown signal type");
}

/// \brief Copy (or decompress) the signal of one row into \p samples.
/// \param row_index Row to extract; must be less than num_rows().
/// \param samples Destination; its size must equal the row's value in the samples column.
/// \returns OK on success, Invalid if the row is out of range, the destination size does
///          not match, the stored signal length disagrees with the samples column, or the
///          signal type is not recognised; decompression errors are passed through.
Status SignalTableRecordBatch::extract_signal_row(
    std::size_t row_index,
    gsl::span<std::int16_t> samples) const
{
    if (row_index >= num_rows()) {
        return pod5::Status::Invalid(
            "Queried signal row ",
            row_index,
            " is outside the available rows (",
            num_rows(),
            " in batch)");
    }

    auto sample_count = samples_column();
    auto samples_in_row = sample_count->Value(row_index);
    if (samples_in_row != samples.size()) {
        return pod5::Status::Invalid(
            "Unexpected size for sample array ", samples.size(), " expected ", samples_in_row);
    }

    switch (m_field_locations.signal_type) {
    case SignalType::UncompressedSignal: {
        auto signal_column = uncompressed_signal_column();
        auto signal =
            std::static_pointer_cast<arrow::Int16Array>(signal_column->value_slice(row_index));

        // The samples column and the list length are stored independently, so a corrupt
        // file can make them disagree; never copy more than the destination can hold.
        if (static_cast<std::size_t>(signal->length()) != static_cast<std::size_t>(samples.size()))
        {
            return pod5::Status::Invalid(
                "Signal row ",
                row_index,
                " holds ",
                signal->length(),
                " samples but ",
                samples.size(),
                " were expected");
        }

        std::copy(signal->raw_values(), signal->raw_values() + signal->length(), samples.begin());
        return Status::OK();
    }
    case SignalType::VbzSignal: {
        auto signal_column = vbz_signal_column();
        auto signal_compressed = signal_column->Value(row_index);
        return pod5::decompress_signal(signal_compressed, m_pool, samples);
    }
    }

    return pod5::Status::Invalid("Unknown signal type");
}

/// \brief Get the stored bytes of one row's signal without copying or decompressing.
///
/// For uncompressed signal the returned buffer is a slice of the column's value buffer
/// covering the row's 16 bit samples; for vbz signal it is the row's compressed bytes.
/// \param row_index Row to extract; must be less than num_rows().
/// \returns The buffer, or Invalid if the row is out of range or the signal type is not
///          recognised.
Result<std::shared_ptr<arrow::Buffer>> SignalTableRecordBatch::extract_signal_row_inplace(
    std::size_t row_index) const
{
    if (row_index >= num_rows()) {
        return pod5::Status::Invalid(
            "Queried signal row ",
            row_index,
            " is outside the available rows (",
            num_rows(),
            " in batch)");
    }

    switch (m_field_locations.signal_type) {
    case SignalType::UncompressedSignal: {
        auto const signal_column = uncompressed_signal_column();
        auto const value_slice =
            std::static_pointer_cast<arrow::Int16Array>(signal_column->value_slice(row_index));

        // Size of one stored sample. (This must be the element size, not the size of an
        // arrow type-descriptor class, otherwise the byte range below is wrong.)
        constexpr std::int64_t element_size = sizeof(std::int16_t);

        // values() is the whole, unsliced value buffer, so convert the slice's element
        // offset and length into bytes. Using the slice's own offset also honours any
        // offset carried by the child values array.
        auto const values = value_slice->values();
        auto const offset = value_slice->offset();
        auto const length = value_slice->length();
        return arrow::SliceBuffer(values, offset * element_size, length * element_size);
    }
    case SignalType::VbzSignal: {
        auto signal_column = vbz_signal_column();
        return signal_column->ValueAsBuffer(row_index);
    }
    }

    return pod5::Status::Invalid("Unknown signal type");
}

//---------------------------------------------------------------------------------------------------------------------

/// \brief Construct a signal table reader over an already-opened arrow file reader.
/// \param input_source             Handle forwarded to the TableReader base.
/// \param reader                   The arrow file reader, forwarded to the TableReader base.
/// \param field_locations          Signal type and column indices of the signal table schema.
/// \param schema_metadata          Schema metadata, forwarded to the TableReader base.
/// \param num_record_batches       Number of record batches in the file; passed to the batch
///                                 cache map's constructor (as its initial bucket count).
/// \param batch_size               Row count used to map a table row onto (batch, row-in-batch).
/// \param max_cached_table_batches Limit on cached batches; 0 disables the limit.
/// \param pool                     Memory pool handed to each SignalTableRecordBatch created.
SignalTableReader::SignalTableReader(
    std::shared_ptr<void> && input_source,
    std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
    SignalTableSchemaDescription field_locations,
    SchemaMetadataDescription && schema_metadata,
    std::size_t num_record_batches,
    std::size_t batch_size,
    std::size_t max_cached_table_batches,
    arrow::MemoryPool * pool)
: TableReader(std::move(input_source), std::move(reader), std::move(schema_metadata), pool)
, m_field_locations(field_locations)
, m_pool(pool)
, m_max_cached_table_batches(max_cached_table_batches)
, m_table_batches(num_record_batches)
, m_batch_size(batch_size)
{
}

/// \brief Move-construct a reader, taking over [other]'s base reader state and batch cache map.
///
/// Only the members named in the initializer list are transferred. The mutex is not movable and
/// is default-constructed; no lock is taken on [other] here.
SignalTableReader::SignalTableReader(SignalTableReader && other)
: TableReader(std::move(other))
, m_field_locations(std::move(other.m_field_locations))
, m_pool(other.m_pool)
, m_max_cached_table_batches(other.m_max_cached_table_batches)
, m_table_batches(std::move(other.m_table_batches))
, m_batch_size(other.m_batch_size)
{
}

/// \brief Move-assign a reader, replacing this reader's state with [other]'s.
///
/// The last-read fast-path cache and the access counter are transferred as well: leaving them
/// untouched would let read_record_batch() return a batch belonging to the file this reader was
/// previously reading, and would desynchronise the counter from the moved cache entries.
///
/// No lock is taken on either reader; callers must not use them concurrently with this call.
SignalTableReader & SignalTableReader::operator=(SignalTableReader && other)
{
    if (this == &other) {
        return *this;
    }

    m_field_locations = std::move(other.m_field_locations);
    m_pool = other.m_pool;
    m_max_cached_table_batches = other.m_max_cached_table_batches;
    m_batch_size = other.m_batch_size;
    m_table_batches = std::move(other.m_table_batches);

    // Carry over the single-batch fast path so it always refers to the new source.
    m_last_read_record_batch_index = other.m_last_read_record_batch_index;
    m_last_read_record_batch = std::move(other.m_last_read_record_batch);
    m_last_access_index = other.m_last_access_index;

    // The moved-from reader no longer holds a last-read batch.
    other.m_last_read_record_batch_index = static_cast<std::size_t>(-1);

    static_cast<TableReader &>(*this) = std::move(static_cast<TableReader &>(other));
    return *this;
}

/// \brief Fetch record batch [i] of the signal table, using cached batches where possible.
///
/// Lookup order: the most recently read batch, then the batch cache, then the underlying file.
/// A batch read from the file is remembered as the most recently read batch and inserted into
/// the cache. The whole call runs under m_batch_get_mutex.
///
/// \param i Index of the record batch to read.
/// \returns The requested batch, or the error from reading it.
Result<SignalTableRecordBatch> SignalTableReader::read_record_batch(std::size_t i) const
{
    std::lock_guard<std::mutex> guard(m_batch_get_mutex);

    // Fast path: same batch as the previous read.
    if (i == m_last_read_record_batch_index) {
        return pod5::SignalTableRecordBatch{m_last_read_record_batch, m_field_locations, m_pool};
    }

    // Cache hit: refresh the entry's access stamp and hand back the cached batch.
    auto const cached = m_table_batches.find(i);
    if (cached != m_table_batches.end()) {
        auto & entry = cached->second;
        entry.last_access_index = m_last_access_index++;
        return entry.item;
    }

    // A limit of zero means "unlimited"; otherwise evict before inserting a new entry.
    bool const cache_is_limited = m_max_cached_table_batches != 0;
    if (cache_is_limited && m_table_batches.size() >= m_max_cached_table_batches) {
        SignalTableReaderCacheCleaner::make_space_in_table_batches(m_table_batches);
        assert(m_table_batches.size() < m_max_cached_table_batches);
    }

    // Cache miss: load from the file, then record it both as "last read" and in the cache.
    ARROW_ASSIGN_OR_RAISE(m_last_read_record_batch, TableReader::ReadRecordBatch(i));
    m_last_read_record_batch_index = i;

    auto const emplace_result = m_table_batches.emplace(
        i,
        CachedItem{
            pod5::SignalTableRecordBatch{m_last_read_record_batch, m_field_locations, m_pool},
            m_last_access_index++});
    auto const & new_entry = emplace_result.first->second;
    return new_entry.item;
}

/// \brief Map an absolute signal table row onto the record batch that contains it.
/// \param row            Absolute row index in the signal table.
/// \param[out] batch_row [optional] Receives the row's index within its batch. It is written
///                       before the batch index is range checked.
/// \returns The batch index, or Invalid if the table has no rows or the batch index is past the
///          last record batch.
Result<std::size_t> SignalTableReader::signal_batch_for_row_id(
    std::uint64_t row,
    std::size_t * batch_row) const
{
    if (m_batch_size == 0) {
        return Status::Invalid("Invalid row '", row, "' for file with zero signal rows.");
    }

    auto batch_index = row / m_batch_size;

    if (batch_row != nullptr) {
        // Remainder of the division above: the row's position inside its batch.
        *batch_row = row % m_batch_size;
    }

    if (batch_index < num_record_batches()) {
        return batch_index;
    }

    return Status::Invalid("Row outside batch bounds");
}

/// \brief Sum the sample counts stored for a list of signal table rows.
/// \param row_indices Absolute signal table rows to query.
/// \returns The total of the "samples" column over [row_indices], or an error if a row cannot be
///          located or its batch cannot be read.
Result<std::size_t> SignalTableReader::extract_sample_count(
    gsl::span<std::uint64_t const> const & row_indices) const
{
    std::size_t sample_count = 0;
    for (auto const & signal_row : row_indices) {
        std::size_t batch_row = 0;
        ARROW_ASSIGN_OR_RAISE(
            auto const signal_batch_index, signal_batch_for_row_id(signal_row, &batch_row));

        ARROW_ASSIGN_OR_RAISE(auto const & signal_batch, read_record_batch(signal_batch_index));
        auto const & samples_column = signal_batch.samples_column();

        // signal_batch_for_row_id only validates the batch index. A batch can hold fewer rows
        // than m_batch_size (e.g. the final one), and Value() performs no bounds check.
        auto const rows_in_batch = static_cast<std::size_t>(samples_column->length());
        if (batch_row >= rows_in_batch) {
            return Status::Invalid(
                "Queried signal row ",
                batch_row,
                " is outside the available rows (",
                rows_in_batch,
                " in batch)");
        }

        sample_count += samples_column->Value(batch_row);
    }
    return sample_count;
}

/// \brief Extract the samples of a list of signal table rows into one contiguous output span.
///
/// Rows are written back to back, in the order given by [row_indices].
///
/// \param row_indices    Absolute signal table rows to extract.
/// \param output_samples Destination; must hold at least the total sample count of the rows.
/// \returns OK on success, Invalid if a row is out of range or [output_samples] is too small, or
///          the error from locating/reading/extracting a row.
Status SignalTableReader::extract_samples(
    gsl::span<std::uint64_t const> const & row_indices,
    gsl::span<std::int16_t> const & output_samples) const
{
    std::size_t sample_count = 0;

    for (auto const & signal_row : row_indices) {
        std::size_t batch_row = 0;
        ARROW_ASSIGN_OR_RAISE(
            auto const signal_batch_index, signal_batch_for_row_id(signal_row, &batch_row));

        ARROW_ASSIGN_OR_RAISE(auto const & signal_batch, read_record_batch(signal_batch_index));
        auto const & samples_column = signal_batch.samples_column();

        // signal_batch_for_row_id only validates the batch index. A batch can hold fewer rows
        // than m_batch_size (e.g. the final one), and Value() performs no bounds check.
        auto const rows_in_batch = static_cast<std::size_t>(samples_column->length());
        if (batch_row >= rows_in_batch) {
            return Status::Invalid(
                "Queried signal row ",
                batch_row,
                " is outside the available rows (",
                rows_in_batch,
                " in batch)");
        }

        auto const row_samples_count = samples_column->Value(batch_row);
        std::size_t const sample_start = sample_count;
        sample_count += row_samples_count;
        if (sample_count > output_samples.size()) {
            return Status::Invalid("Too few samples in input samples array");
        }

        // Each row fills its own window of the output, directly after the previous row.
        ARROW_RETURN_NOT_OK(signal_batch.extract_signal_row(
            batch_row, output_samples.subspan(sample_start, row_samples_count)));
    }
    return Status::OK();
}

/// \brief Collect the stored (not decompressed) signal buffers for a list of signal table rows.
/// \param row_indices       Absolute signal table rows to query.
/// \param[out] sample_count The sample count of each row is appended here, in row order. Existing
///                          content is kept.
/// \returns One buffer per row, in the order of [row_indices], or the first error encountered.
Result<std::vector<std::shared_ptr<arrow::Buffer>>> SignalTableReader::extract_samples_inplace(
    gsl::span<std::uint64_t const> const & row_indices,
    std::vector<std::uint32_t> & sample_count) const
{
    std::vector<std::shared_ptr<arrow::Buffer>> row_buffers;

    for (auto const & table_row : row_indices) {
        std::size_t row_in_batch = 0;
        ARROW_ASSIGN_OR_RAISE(
            auto const batch_index, signal_batch_for_row_id(table_row, &row_in_batch));

        ARROW_ASSIGN_OR_RAISE(auto const & batch, read_record_batch(batch_index));

        // The row's buffer is fetched first; it validates the row before the count is read.
        ARROW_ASSIGN_OR_RAISE(auto row_buffer, batch.extract_signal_row_inplace(row_in_batch));
        row_buffers.push_back(std::move(row_buffer));

        auto const & counts = batch.samples_column();
        sample_count.push_back(counts->Value(row_in_batch));
    }

    return row_buffers;
}

/// \brief The signal type recorded in this reader's schema description.
SignalType SignalTableReader::signal_type() const { return m_field_locations.signal_type; }

//---------------------------------------------------------------------------------------------------------------------
/// \brief Open a signal table from a random access file and build a reader for it.
///
/// The schema must carry key/value metadata and match the signal table layout. The row count of
/// the first record batch (if any) is taken as the table's batch size.
///
/// \param input                    The file to read the table from.
/// \param max_cached_table_batches Limit on cached batches passed to the reader.
/// \param pool                     Memory pool used for reading.
/// \returns The reader, or the first error encountered while opening or validating the table.
Result<SignalTableReader> make_signal_table_reader(
    std::shared_ptr<arrow::io::RandomAccessFile> const & input,
    std::size_t max_cached_table_batches,
    arrow::MemoryPool * pool)
{
    arrow::ipc::IpcReadOptions read_options;
    read_options.memory_pool = pool;

    ARROW_ASSIGN_OR_RAISE(
        auto file_reader, arrow::ipc::RecordBatchFileReader::Open(input, read_options));

    auto schema_key_values = file_reader->schema()->metadata();
    if (!schema_key_values) {
        return Status::IOError("Missing metadata on signal table schema");
    }
    ARROW_ASSIGN_OR_RAISE(
        auto schema_metadata, read_schema_key_value_metadata(schema_key_values));
    ARROW_ASSIGN_OR_RAISE(auto signal_fields, read_signal_table_schema(file_reader->schema()));

    // All row -> batch lookups divide by the size of batch zero; an empty table uses zero.
    std::size_t const batch_count = file_reader->num_record_batches();
    std::size_t rows_per_batch = 0;
    if (batch_count != 0) {
        ARROW_ASSIGN_OR_RAISE(auto const first_batch, ReadRecordBatchAndValidate(*file_reader, 0));
        rows_per_batch = first_batch->num_rows();
    }

    return SignalTableReader(
        {input},
        std::move(file_reader),
        signal_fields,
        std::move(schema_metadata),
        batch_count,
        rows_per_batch,
        max_cached_table_batches,
        pool);
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_table_reader.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/signal_table_schema.h"
#include "pod5_format/table_reader.h"
#include "pod5_format/types.h"

#include <arrow/io/type_fwd.h>
#include <gsl/gsl-lite.hpp>

#include <atomic>
#include <mutex>
#include <unordered_map>

namespace arrow {
class Schema;

namespace io {
class RandomAccessFile;
}

namespace ipc {
class RecordBatchFileReader;
}
}  // namespace arrow

namespace pod5 {

struct SignalTableReaderCacheCleaner;

/// \brief One record batch of the signal table, with typed access to its columns and helpers to
///        extract the signal stored in a row.
class POD5_FORMAT_EXPORT SignalTableRecordBatch : public TableRecordBatch {
public:
    /// \param batch            The arrow record batch to wrap.
    /// \param field_locations  Signal type and column indices of the signal table schema.
    /// \param pool             Memory pool, used when decompressing signal.
    SignalTableRecordBatch(
        std::shared_ptr<arrow::RecordBatch> const & batch,
        SignalTableSchemaDescription field_locations,
        arrow::MemoryPool * pool);

    // Typed column accessors. The two signal accessors correspond to the two SignalType values;
    // presumably only the one matching the table's signal type is valid - verify in the .cpp.
    std::shared_ptr<UuidArray> read_id_column() const;
    std::shared_ptr<arrow::LargeListArray> uncompressed_signal_column() const;
    std::shared_ptr<VbzSignalArray> vbz_signal_column() const;
    /// \brief The per-row sample count column.
    std::shared_ptr<arrow::UInt32Array> samples_column() const;

    // NOTE(review): presumably the stored byte size of the signal in [row_index] - confirm
    // against the implementation.
    Result<std::size_t> samples_byte_count(std::size_t row_index) const;

    /// \brief Extract a row of sample data into [samples], decompressing if required.
    Status extract_signal_row(std::size_t row_index, gsl::span<std::int16_t> samples) const;
    /// \brief Get the signal data of a row as stored in the table, without decompressing.
    /// \returns A buffer for the row's data, or Invalid if [row_index] is outside the batch.
    Result<std::shared_ptr<arrow::Buffer>> extract_signal_row_inplace(std::size_t row_index) const;

private:
    SignalTableSchemaDescription m_field_locations;
    arrow::MemoryPool * m_pool;
};

/// \brief Reader for the signal table of a file, with caching of the record batches it reads.
class POD5_FORMAT_EXPORT SignalTableReader : public TableReader {
public:
    /// \param input_source             Handle forwarded to the TableReader base.
    /// \param reader                   The arrow file reader for the table.
    /// \param field_locations          Signal type and column indices of the table schema.
    /// \param schema_metadata          Metadata read from the table schema.
    /// \param num_record_batches       Number of record batches in the table.
    /// \param batch_size               Row count used to map table rows onto batches.
    /// \param max_cached_table_batches Limit on cached batches; 0 means no limit.
    /// \param pool                     Memory pool used for the batches created by the reader.
    SignalTableReader(
        std::shared_ptr<void> && input_source,
        std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
        SignalTableSchemaDescription field_locations,
        SchemaMetadataDescription && schema_metadata,
        std::size_t num_record_batches,
        std::size_t batch_size,
        std::size_t max_cached_table_batches,
        arrow::MemoryPool * pool);

    SignalTableReader(SignalTableReader &&);
    SignalTableReader & operator=(SignalTableReader &&);

    /// \brief Read record batch [i], served from the reader's cache when available.
    Result<SignalTableRecordBatch> read_record_batch(std::size_t i) const;

    /// \brief Find the record batch containing an absolute signal table row.
    /// \param row              The absolute row index in the signal table.
    /// \param[out] batch_row   [optional] The index of the row within the returned batch.
    /// \returns The index of the batch containing [row].
    Result<std::size_t> signal_batch_for_row_id(std::uint64_t row, std::size_t * batch_row) const;

    /// \brief Find the number of samples in a given list of rows.
    /// \param row_indices      The rows to query for sample count.
    /// \returns The sum of all sample counts on input rows.
    Result<std::size_t> extract_sample_count(
        gsl::span<std::uint64_t const> const & row_indices) const;

    /// \brief Extract the samples for a list of rows.
    /// \param row_indices      The rows to query for samples.
    /// \param output_samples   The output samples from the rows, written back to back in row order.
    ///                         Must be large enough to hold the samples of all requested rows.
    Status extract_samples(
        gsl::span<std::uint64_t const> const & row_indices,
        gsl::span<std::int16_t> const & output_samples) const;

    /// \brief Extract the samples as written in the arrow table for a list of rows.
    /// \param row_indices      The rows to query for samples.
    /// \param[out] sample_count The sample count of each row is appended to this vector.
    /// \returns One buffer per requested row, in row order.
    Result<std::vector<std::shared_ptr<arrow::Buffer>>> extract_samples_inplace(
        gsl::span<std::uint64_t const> const & row_indices,
        std::vector<std::uint32_t> & sample_count) const;

    /// \brief Find the signal type of this reader
    SignalType signal_type() const;

private:
    SignalTableSchemaDescription m_field_locations;
    arrow::MemoryPool * m_pool;
    // Maximum number of entries kept in m_table_batches; 0 disables the limit.
    std::size_t m_max_cached_table_batches;

    // Index and contents of the batch most recently read from the file. The index starts at
    // -1 converted to std::size_t (the maximum value), which acts as "nothing read yet".
    mutable std::size_t m_last_read_record_batch_index = -1;
    mutable std::shared_ptr<arrow::RecordBatch> m_last_read_record_batch;

    // Held for the duration of read_record_batch().
    mutable std::mutex m_batch_get_mutex;
    using AccessIndex = std::uint64_t;

    // A cached batch together with the access counter value of its most recent use.
    struct CachedItem {
        pod5::SignalTableRecordBatch item;
        AccessIndex last_access_index;
    };

    // Cache of batches already read, keyed by record batch index.
    mutable std::unordered_map<std::size_t, CachedItem> m_table_batches;

    // Counter incremented on every cache insert/hit; used to stamp CachedItem entries.
    mutable AccessIndex m_last_access_index = 0;

    // Row count used by signal_batch_for_row_id to map rows onto batches.
    std::size_t m_batch_size;

    friend struct SignalTableReaderCacheCleaner;
};

/// \brief Make a new reader for a signal table.
/// \param sink The file to read the table from (an input, despite the parameter name).
/// \param max_cached_table_batches Limit on the number of batches the reader caches.
/// \param pool Pool to be used for reading the table.
/// \returns The reader for the table, or an error if the table could not be opened.
POD5_FORMAT_EXPORT Result<SignalTableReader> make_signal_table_reader(
    std::shared_ptr<arrow::io::RandomAccessFile> const & sink,
    std::size_t max_cached_table_batches,
    arrow::MemoryPool * pool);

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_table_schema.cpp
================================================
#include "pod5_format/signal_table_schema.h"

#include "pod5_format/schema_utils.h"
#include "pod5_format/types.h"

#include <arrow/type.h>

namespace pod5 {

/// Build the arrow schema of a signal table: "read_id", "signal" and "samples", in that order.
/// The "signal" field's type depends on [signal_type]. If [field_locations] is given it is reset
/// to its defaults and stamped with [signal_type].
std::shared_ptr<arrow::Schema> make_signal_table_schema(
    SignalType signal_type,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    SignalTableSchemaDescription * field_locations)
{
    auto const read_id_type = uuid();

    if (field_locations != nullptr) {
        SignalTableSchemaDescription locations{};
        locations.signal_type = signal_type;
        *field_locations = locations;
    }

    // Uncompressed signal is a list of int16 samples; VBZ signal uses the vbz_signal type.
    std::shared_ptr<arrow::DataType> signal_field_type;
    switch (signal_type) {
    case SignalType::VbzSignal:
        signal_field_type = vbz_signal();
        break;
    case SignalType::UncompressedSignal:
        signal_field_type = arrow::large_list(arrow::int16());
        break;
    }

    auto const read_id_field = arrow::field("read_id", read_id_type);
    auto const signal_field = arrow::field("signal", signal_field_type);
    auto const samples_field = arrow::field("samples", arrow::uint32());

    return arrow::schema({read_id_field, signal_field, samples_field}, metadata);
}

/// Locate the signal table fields in [schema] and work out which signal type it stores.
/// "read_id" and "samples" are looked up with their expected types; "signal" is looked up by name
/// and must be either a large list of int16 (uncompressed) or the vbz_signal type.
/// Returns the field locations, or a TypeError / lookup error if the schema does not match.
Result<SignalTableSchemaDescription> read_signal_table_schema(
    std::shared_ptr<arrow::Schema> const & schema)
{
    ARROW_ASSIGN_OR_RAISE(auto read_id_index, find_field(schema, "read_id", uuid()));
    ARROW_ASSIGN_OR_RAISE(auto samples_index, find_field(schema, "samples", arrow::uint32()));
    ARROW_ASSIGN_OR_RAISE(auto signal_index, find_field_untyped(schema, "signal"));

    auto const signal_field = schema->field(signal_index);
    auto const signal_arrow_type = signal_field->type();

    if (signal_arrow_type->id() == arrow::Type::LARGE_LIST) {
        // Uncompressed signal: the list elements must be int16 samples.
        auto const & list_type = static_cast<arrow::LargeListType const &>(*signal_arrow_type);
        if (list_type.value_type()->id() != arrow::Type::INT16) {
            return Status::TypeError("Schema field 'signal' list value type is incorrect type");
        }
        return SignalTableSchemaDescription{
            SignalType::UncompressedSignal, read_id_index, signal_index, samples_index};
    }

    if (signal_arrow_type->Equals(vbz_signal())) {
        return SignalTableSchemaDescription{
            SignalType::VbzSignal, read_id_index, signal_index, samples_index};
    }

    return Status::TypeError(
        "Schema field 'signal' is incorrect type: '", signal_arrow_type->name(), "'");
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_table_schema.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/signal_table_utils.h"

#include <memory>

namespace arrow {
class KeyValueMetadata;
class Schema;
}  // namespace arrow

namespace pod5 {

/// \brief Describes a signal table schema: which signal type it stores and the index of each
///        field in the schema.
struct SignalTableSchemaDescription {
    /// Type of signal stored in the "signal" field. Defaulted so that a default-constructed
    /// description never holds an indeterminate value (matches value-initialization, which
    /// yields the first enumerator).
    SignalType signal_type = SignalType::UncompressedSignal;

    /// Schema index of the "read_id" field.
    int read_id = 0;
    /// Schema index of the "signal" field.
    int signal = 1;
    /// Schema index of the "samples" field.
    int samples = 2;
};

/// \brief Make a new schema for a signal table.
/// \param signal_type The type of signal to use; selects the type of the "signal" field.
/// \param metadata Metadata to be applied to the schema.
/// \param field_locations [optional] The signal table field locations, for use when writing to the table.
///                        When non-null it is reset to defaults and its signal_type is set.
/// \returns The schema for a signal table.
POD5_FORMAT_EXPORT std::shared_ptr<arrow::Schema> make_signal_table_schema(
    SignalType signal_type,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    SignalTableSchemaDescription * field_locations);

/// \brief Read the field locations and signal type from an existing signal table schema.
/// \returns The schema description, or an error if the schema is not a valid signal table schema.
POD5_FORMAT_EXPORT Result<SignalTableSchemaDescription> read_signal_table_schema(
    std::shared_ptr<arrow::Schema> const &);

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_table_utils.h
================================================
#pragma once

// std::uint64_t is used below; include its header so this file does not rely on include order.
#include <cstdint>

namespace pod5 {

/// Index of a row in the signal table.
using SignalTableRowIndex = std::uint64_t;

/// How signal is stored in the signal table.
enum class SignalType {
    UncompressedSignal,
    VbzSignal,
};

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_table_writer.cpp
================================================
#include "pod5_format/signal_table_writer.h"

#include "pod5_format/file_output_stream.h"
#include "pod5_format/internal/tracing/tracing.h"
#include "pod5_format/types.h"

#include <arrow/array/builder_binary.h>
#include <arrow/array/builder_nested.h>
#include <arrow/array/builder_primitive.h>
#include <arrow/array/util.h>
#include <arrow/extension_type.h>
#include <arrow/ipc/writer.h>
#include <arrow/record_batch.h>
#include <arrow/type.h>

namespace pod5 {

/// \brief Construct a signal table writer around an already-created arrow record batch writer.
/// \param writer           The arrow writer batches are written to.
/// \param schema           The signal table schema used for every record batch.
/// \param signal_builder   Builder for the "signal" column.
/// \param field_locations  Signal type and column indices of [schema].
/// \param output_stream    Stream notified (batch_complete) after batches are written.
/// \param table_batch_size Number of rows per written record batch.
/// \param pool             Memory pool used by the column builders.
SignalTableWriter::SignalTableWriter(
    std::shared_ptr<arrow::ipc::RecordBatchWriter> && writer,
    std::shared_ptr<arrow::Schema> && schema,
    SignalBuilderVariant && signal_builder,
    SignalTableSchemaDescription const & field_locations,
    std::shared_ptr<FileOutputStream> const & output_stream,
    std::size_t table_batch_size,
    arrow::MemoryPool * pool)
: m_pool(pool)
, m_schema(schema)
, m_field_locations(field_locations)
, m_output_stream{output_stream}
, m_table_batch_size(table_batch_size)
, m_writer(std::move(writer))
, m_signal_builder(std::move(signal_builder))
{
    // The read id and samples builders are created here; only the signal builder is passed in.
    m_read_id_builder = make_read_id_builder(m_pool);
    m_samples_builder = std::make_unique<arrow::UInt32Builder>(m_pool);
}

// Member-wise moves; defined here rather than in the header.
SignalTableWriter::SignalTableWriter(SignalTableWriter && other) = default;
SignalTableWriter & SignalTableWriter::operator=(SignalTableWriter &&) = default;

/// \brief Close the writer if it is still open; any error from close() is discarded.
SignalTableWriter::~SignalTableWriter()
{
    if (m_writer) {
        (void)close();
    }
}

/// \brief Append one row of signal to the current batch.
///
/// The batch is written out as soon as it holds table_batch_size rows.
///
/// \param read_id The read id stored alongside the signal.
/// \param signal  The samples to store; the row's sample count is signal.size().
/// \returns The absolute row index of the new row, or IOError if the writer is closed, or the
///          first builder/write error.
Result<SignalTableRowIndex> SignalTableWriter::add_signal(
    Uuid const & read_id,
    gsl::span<std::int16_t const> const & signal)
{
    POD5_TRACE_FUNCTION();
    if (m_writer == nullptr) {
        return Status::IOError("Writer terminated");
    }

    ARROW_RETURN_NOT_OK(reserve_rows());

    // Rows already flushed plus rows pending in this batch gives the new row's index.
    SignalTableRowIndex const new_row_index =
        m_written_batched_row_count + m_current_batch_row_count;

    // Populate the three columns in schema order: read id, signal, samples.
    ARROW_RETURN_NOT_OK(m_read_id_builder->Append(read_id.data()));
    ARROW_RETURN_NOT_OK(std::visit(visitors::append_signal{signal, m_pool}, m_signal_builder));
    ARROW_RETURN_NOT_OK(m_samples_builder->Append(signal.size()));

    m_current_batch_row_count += 1;
    bool const batch_is_full = m_current_batch_row_count >= m_table_batch_size;
    if (batch_is_full) {
        ARROW_RETURN_NOT_OK(write_batch());
    }

    return new_row_index;
}

/// \brief Append one row of already-compressed signal to the current batch.
///
/// The batch is written out as soon as it holds table_batch_size rows.
///
/// \param read_id      The read id stored alongside the signal.
/// \param signal       The compressed signal bytes, stored as given.
/// \param sample_count The number of samples the bytes represent, stored in "samples".
/// \returns The absolute row index of the new row, or IOError if the writer is closed, or the
///          first builder/write error.
Result<SignalTableRowIndex> SignalTableWriter::add_pre_compressed_signal(
    Uuid const & read_id,
    gsl::span<std::uint8_t const> const & signal,
    std::uint32_t sample_count)
{
    POD5_TRACE_FUNCTION();
    if (m_writer == nullptr) {
        return Status::IOError("Writer terminated");
    }

    ARROW_RETURN_NOT_OK(reserve_rows());

    // Rows already flushed plus rows pending in this batch gives the new row's index.
    SignalTableRowIndex const new_row_index =
        m_written_batched_row_count + m_current_batch_row_count;

    // Populate the three columns in schema order: read id, signal, samples.
    ARROW_RETURN_NOT_OK(m_read_id_builder->Append(read_id.data()));
    ARROW_RETURN_NOT_OK(
        std::visit(visitors::append_pre_compressed_signal{signal}, m_signal_builder));
    ARROW_RETURN_NOT_OK(m_samples_builder->Append(sample_count));

    m_current_batch_row_count += 1;
    bool const batch_is_full = m_current_batch_row_count >= m_table_batch_size;
    if (batch_is_full) {
        ARROW_RETURN_NOT_OK(write_batch());
    }

    return new_row_index;
}

/// \brief Write a complete, pre-built batch of columns directly to the table.
///
/// Cannot be mixed with rows pending from the per-read add methods. Every batch except the final
/// one must hold exactly table_batch_size rows; the final batch also closes the writer.
///
/// \param row_count   Number of rows in [columns].
/// \param columns     The column arrays of the batch, matching the table schema.
/// \param final_batch True if this is the last batch to be written.
/// \returns The [first, one-past-last) absolute row indices of the written rows.
pod5::Result<std::pair<SignalTableRowIndex, SignalTableRowIndex>>
SignalTableWriter::add_signal_batch(
    std::size_t row_count,
    std::vector<std::shared_ptr<arrow::Array>> && columns,
    bool final_batch)
{
    POD5_TRACE_FUNCTION();
    if (m_writer == nullptr) {
        return Status::Invalid("Unable to write batches, writer is closed.");
    }

    bool const has_pending_rows = m_current_batch_row_count != 0;
    if (has_pending_rows) {
        return Status::Invalid("Unable to write batches directly and using per read methods");
    }

    bool const is_full_batch = row_count == m_table_batch_size;
    if (!(final_batch || is_full_batch)) {
        return Status::Invalid("Unable to write invalid sized signal batch to signal table");
    }

    auto const batch = arrow::RecordBatch::Make(m_schema, row_count, std::move(columns));
    ARROW_RETURN_NOT_OK(m_writer->WriteRecordBatch(*batch));
    if (final_batch) {
        ARROW_RETURN_NOT_OK(close());
    }

    // Row accounting is only updated once the batch (and any close) succeeded.
    auto const first_row_id = m_written_batched_row_count;
    m_written_batched_row_count = first_row_id + row_count;
    return std::make_pair(first_row_id, m_written_batched_row_count);
}

/// \brief Flush any pending rows and close the underlying writer.
///
/// Calling close() on an already-closed writer is a no-op. If flushing or closing fails the
/// error is returned and the writer is left open.
Status SignalTableWriter::close()
{
    if (m_writer) {
        // Pending rows go out as a final (possibly short) batch before the file is finalised.
        ARROW_RETURN_NOT_OK(write_batch());
        ARROW_RETURN_NOT_OK(m_writer->Close());

        // A null writer marks this object as closed.
        m_writer.reset();
    }

    return Status::OK();
}

/// \brief The signal type recorded in this writer's schema description.
SignalType SignalTableWriter::signal_type() const { return m_field_locations.signal_type; }

/// \brief Write a caller-provided record batch to the table and notify the output stream.
///
/// The writer's own row counters are not updated by this method.
///
/// \param record_batch The batch to write.
/// \returns IOError if the writer has been closed, otherwise the status of the write and of the
///          output stream's batch_complete().
Status SignalTableWriter::write_batch(arrow::RecordBatch const & record_batch)
{
    // This method is public, so it can be reached after close(); fail like the other write
    // paths instead of dereferencing a null writer.
    if (!m_writer) {
        return Status::IOError("Writer terminated");
    }

    ARROW_RETURN_NOT_OK(m_writer->WriteRecordBatch(record_batch));
    return m_output_stream->batch_complete();
}

/// \brief Finish the column builders and write the pending rows as one record batch.
///
/// Does nothing when no rows are pending. The row counters are advanced before the batch is
/// handed to the arrow writer.
///
/// \returns OK, IOError if rows are pending but the writer is closed, or the first builder/write
///          error.
Status SignalTableWriter::write_batch()
{
    POD5_TRACE_FUNCTION();
    auto const pending_rows = m_current_batch_row_count;
    if (pending_rows == 0) {
        return Status::OK();
    }

    if (m_writer == nullptr) {
        return Status::IOError("Writer terminated");
    }

    // One slot per schema field; each builder finishes into the slot for its field index.
    std::vector<std::shared_ptr<arrow::Array>> finished_columns(3);
    ARROW_RETURN_NOT_OK(m_read_id_builder->Finish(&finished_columns[m_field_locations.read_id]));

    ARROW_RETURN_NOT_OK(std::visit(
        visitors::finish_column{&finished_columns[m_field_locations.signal]}, m_signal_builder));

    ARROW_RETURN_NOT_OK(m_samples_builder->Finish(&finished_columns[m_field_locations.samples]));

    auto const batch = arrow::RecordBatch::Make(m_schema, pending_rows, std::move(finished_columns));

    // The pending rows now count as written and a new batch starts empty.
    m_written_batched_row_count += pending_rows;
    m_current_batch_row_count = 0;

    ARROW_RETURN_NOT_OK(m_writer->WriteRecordBatch(*batch));
    return m_output_stream->batch_complete();
}

/// \brief Reserve builder capacity for a full batch of rows.
///
/// Only acts at the start of a batch (no rows pending); otherwise returns OK immediately.
Status SignalTableWriter::reserve_rows()
{
    // Size hint handed to the signal builder alongside the row count.
    static constexpr std::uint32_t APPROX_READ_SIZE = 102'400;

    bool const batch_already_started = m_current_batch_row_count > 0;
    if (batch_already_started) {
        return arrow::Status::OK();
    }

    ARROW_RETURN_NOT_OK(m_read_id_builder->Reserve(m_table_batch_size));
    ARROW_RETURN_NOT_OK(m_samples_builder->Reserve(m_table_batch_size));

    visitors::reserve_rows const reserve_signal{m_table_batch_size, APPROX_READ_SIZE};
    return std::visit(reserve_signal, m_signal_builder);
}

/// Create the signal table schema, an arrow file writer on [sink] and the signal builder for
/// [compression_type], then bundle them into a SignalTableWriter.
/// Returns the writer, or the first error from creating the arrow writer or the signal builder.
Result<SignalTableWriter> make_signal_table_writer(
    std::shared_ptr<FileOutputStream> const & sink,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    std::size_t table_batch_size,
    SignalType compression_type,
    arrow::MemoryPool * pool)
{
    SignalTableSchemaDescription schema_description;
    auto table_schema = make_signal_table_schema(compression_type, metadata, &schema_description);

    arrow::ipc::IpcWriteOptions write_options;
    write_options.memory_pool = pool;

    ARROW_ASSIGN_OR_RAISE(
        auto file_writer, arrow::ipc::MakeFileWriter(sink, table_schema, write_options, metadata));

    ARROW_ASSIGN_OR_RAISE(auto builder, make_signal_builder(compression_type, pool));

    return SignalTableWriter(
        std::move(file_writer),
        std::move(table_schema),
        std::move(builder),
        schema_description,
        sink,
        table_batch_size,
        pool);
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/signal_table_writer.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/signal_builder.h"
#include "pod5_format/signal_table_schema.h"
#include "pod5_format/uuid.h"

#include <arrow/io/type_fwd.h>
#include <gsl/gsl-lite.hpp>

namespace arrow {
class Schema;

namespace ipc {
class RecordBatchWriter;
}
}  // namespace arrow

namespace pod5 {

class FileOutputStream;

/// \brief Writer for the signal table of a file. Rows are accumulated into batches of
///        table_batch_size rows, which are written to the underlying arrow writer.
class POD5_FORMAT_EXPORT SignalTableWriter {
public:
    /// \param writer           The arrow writer batches are written to.
    /// \param schema           The signal table schema used for every record batch.
    /// \param signal_builder   Builder for the "signal" column.
    /// \param field_locations  Signal type and column indices of [schema].
    /// \param output_stream    Stream notified after batches are written.
    /// \param table_batch_size Number of rows per written record batch.
    /// \param pool             Memory pool used by the column builders.
    SignalTableWriter(
        std::shared_ptr<arrow::ipc::RecordBatchWriter> && writer,
        std::shared_ptr<arrow::Schema> && schema,
        SignalBuilderVariant && signal_builder,
        SignalTableSchemaDescription const & field_locations,
        std::shared_ptr<FileOutputStream> const & output_stream,
        std::size_t table_batch_size,
        arrow::MemoryPool * pool);
    SignalTableWriter(SignalTableWriter &&);
    SignalTableWriter & operator=(SignalTableWriter &&);
    SignalTableWriter(SignalTableWriter const &) = delete;
    SignalTableWriter & operator=(SignalTableWriter const &) = delete;
    /// \brief Closes the writer if it is still open, discarding any error.
    ~SignalTableWriter();

    /// \brief Find the size of table batches for the signal table writer.
    std::size_t table_batch_size() const { return m_table_batch_size; }

    /// \brief Add a read to the signal table, adding to the current batch.
    ///        The batch is written once it holds #table_batch_size rows.
    /// \param read_id The read id for the read entry
    /// \param signal The signal for the read entry
    /// \returns The row index of the inserted signal, or a status on failure.
    Result<SignalTableRowIndex> add_signal(
        Uuid const & read_id,
        gsl::span<std::int16_t const> const & signal);

    /// \brief Add a pre-compressed read to the signal table, adding to the current batch.
    ///        The batch is written once it holds #table_batch_size rows, or when #close is
    ///        called.
    ///
    ///        The bytes are stored as given, so the caller must have compressed the signal in
    ///        the format matching this writer's #signal_type prior to calling this method.
    ///
    /// \param read_id The read id for the read entry
    /// \param signal The compressed signal bytes for the read entry
    /// \param sample_count The number of samples represented by [signal]
    /// \returns The row index of the inserted signal, or a status on failure.
    Result<SignalTableRowIndex> add_pre_compressed_signal(
        Uuid const & read_id,
        gsl::span<std::uint8_t const> const & signal,
        std::uint32_t sample_count);

    /// \brief Write a complete, pre-built batch of columns directly to the table.
    ///        Cannot be used while rows added with the per-read methods are pending.
    /// \param row_count The number of rows in [columns]; must equal #table_batch_size unless
    ///                  [final_batch] is set.
    /// \param columns The column arrays of the batch.
    /// \param final_batch True if this is the last batch; the writer is closed after writing it.
    /// \returns The first and one-past-last row indices of the written rows, or a status on failure.
    pod5::Result<std::pair<SignalTableRowIndex, SignalTableRowIndex>> add_signal_batch(
        std::size_t row_count,
        std::vector<std::shared_ptr<arrow::Array>> && columns,
        bool final_batch);

    /// \brief Close this writer, signaling no further data will be written to the writer.
    ///        Pending rows are written first; closing an already closed writer does nothing.
    Status close();

    /// \brief Find the signal type of this writer
    SignalType signal_type() const;

    /// \brief Reserve space for a batch of rows; called by the add methods and only acts when
    ///        no rows are pending in the current batch.
    Status reserve_rows();

    /// \brief Find the schema for the signal table
    std::shared_ptr<arrow::Schema> const & schema() const { return m_schema; }

    /// \brief Flush passed data into the writer as a record batch.
    Status write_batch(arrow::RecordBatch const &);

private:
    /// \brief Flush buffered data into the writer as a record batch.
    Status write_batch();

    arrow::MemoryPool * m_pool = nullptr;
    std::shared_ptr<arrow::Schema> m_schema;
    SignalTableSchemaDescription m_field_locations;
    std::shared_ptr<FileOutputStream> m_output_stream;
    std::size_t m_table_batch_size;

    // Null once the writer has been closed.
    std::shared_ptr<arrow::ipc::RecordBatchWriter> m_writer;

    // One builder per column of the signal table.
    std::unique_ptr<arrow::FixedSizeBinaryBuilder> m_read_id_builder;
    SignalBuilderVariant m_signal_builder;
    std::unique_ptr<arrow::UInt32Builder> m_samples_builder;

    // Rows already written in completed batches, and rows pending in the current batch.
    std::size_t m_written_batched_row_count = 0;
    std::size_t m_current_batch_row_count = 0;
};

/// \brief Make a new writer for a signal table.
/// \param sink Sink to be used for output of the table.
/// \param metadata Metadata to be applied to the table schema.
/// \param table_batch_size The size of each batch written for the table.
/// \param compression_type The type of signal stored in the table.
/// \param pool Pool to be used for building table in memory.
/// \returns The writer for the new table.
POD5_FORMAT_EXPORT Result<SignalTableWriter> make_signal_table_writer(
    std::shared_ptr<FileOutputStream> const & sink,
    std::shared_ptr<arrow::KeyValueMetadata const> const & metadata,
    std::size_t table_batch_size,
    SignalType compression_type,
    arrow::MemoryPool * pool);

}  // namespace pod5


================================================
FILE: c++/pod5_format/svb16/common.hpp
================================================
#pragma once

#if __cplusplus >= 201703L
#define SVB16_IF_CONSTEXPR if constexpr
#else
#define SVB16_IF_CONSTEXPR if
#endif

#ifdef _MSC_VER
#define SVB_RESTRICT __restrict
#else
#define SVB_RESTRICT __restrict__
#endif

#if defined(__x86_64__) || defined(_M_AMD64)  // x64
#define SVB16_X64
#elif defined(__arm__) || defined(__aarch64__)
#define SVB16_ARM
#endif

#ifndef __has_builtin
#define __has_builtin(x) 0
#endif

#if __has_builtin(__builtin_popcount)
// likely to be a single instruction (POPCNT) on x86_64
#define svb16_popcount __builtin_popcount
#else
// optimising compilers can often convert this pattern to POPCNT on x86_64
// Portable bit count: sums neighbouring bit fields of doubling width, then adds the four
// per-byte totals with a multiply. Written for a 32-bit value.
inline int svb16_popcount(unsigned int i)
{
    // Each 2-bit field holds the number of set bits of the original pair.
    unsigned int const pair_counts = i - ((i >> 1) & 0x55555555);
    // Each 4-bit field holds the count for its nibble.
    unsigned int const nibble_counts =
        (pair_counts & 0x33333333) + ((pair_counts >> 2) & 0x33333333);
    // Each byte holds the count for that byte.
    unsigned int const byte_counts = (nibble_counts + (nibble_counts >> 4)) & 0x0F0F0F0F;
    // The multiply accumulates all four byte counts into the top byte.
    return (byte_counts * 0x01010101) >> 24;
}
#endif


================================================
FILE: c++/pod5_format/svb16/decode.hpp
================================================
#pragma once

#include "common.hpp"
#include "decode_scalar.hpp"
#include "svb16.h"  // svb16_key_length

#include <type_traits>

#ifdef SVB16_X64
#include "decode_x64.hpp"
#include "simd_detect_x64.hpp"
#endif

namespace svb16 {

// Required extra space after readable buffers passed in.
//
// On x64 builds (SVB16_X64), one 128-bit register's worth of readable bytes is required beyond
// the end of all input buffers; on other builds no padding is required.
inline std::size_t decode_input_buffer_padding_byte_count()
{
#ifdef SVB16_X64
    return sizeof(__m128i);
#else
    return 0;
#endif
}

// Decode `out.size()` values from `in` into `out`.
//
// `in` starts with the key bytes (their count is derived from the output size), followed by the
// data bytes. On x64 the SSE implementation is used when SSE4.1 is available at runtime,
// otherwise the scalar implementation is used.
//
// Returns the distance from the start of `in` to the position the decoder stopped reading.
template <typename Int16T, bool UseDelta, bool UseZigzag>
size_t decode(gsl::span<Int16T> out, gsl::span<uint8_t const> in, Int16T prev = 0)
{
    auto const key_byte_count = ::svb16_key_length(out.size());
    auto const key_bytes = in.subspan(0, key_byte_count);
    auto const data_bytes = in.subspan(key_byte_count);
#ifdef SVB16_X64
    if (has_sse4_1()) {
        auto const sse_end = decode_sse<Int16T, UseDelta, UseZigzag>(out, key_bytes, data_bytes, prev);
        return sse_end - in.begin();
    }
#endif
    auto const scalar_end =
        decode_scalar<Int16T, UseDelta, UseZigzag>(out, key_bytes, data_bytes, prev);
    return scalar_end - in.begin();
}

// Check that `compressed_input` has exactly the size implied by its key bits for `out_size`
// decoded values.
//
// Each key bit selects a 1-byte (bit clear) or 2-byte (bit set) encoded value. The input is valid
// when it is large enough to hold the keys and the data after the keys is exactly as long as the
// sum of the encoded value sizes.
//
// Returns true if the sizes are consistent, false otherwise.
inline bool validate(gsl::span<uint8_t const> compressed_input, std::size_t out_size)
{
    auto const keys_length = ::svb16_key_length(out_size);
    if (keys_length > compressed_input.size()) {
        return false;
    }

    // Pull out the parts of the input data.
    auto const keys_span = compressed_input.subspan(0, keys_length);
    auto const data_span = compressed_input.subspan(keys_length);
    auto keys_ptr = keys_span.begin();

    // Accumulate the key sizes in a wider type to avoid overflow.
    using Accumulator = std::
        conditional_t<sizeof(std::size_t) >= sizeof(std::uint64_t), std::size_t, std::uint64_t>;
    Accumulator encoded_size = 0;

    // Give the compiler a hint that it can avoid branches in the inner loop.
    for (std::size_t c = 0; c < out_size / 8; c++) {
        uint8_t const key_byte = *keys_ptr++;
        for (uint8_t shift = 0; shift < 8; shift++) {
            uint8_t const code = (key_byte >> shift) & 0x01;
            encoded_size += code + 1;
        }
    }

    // Process the remaining (fewer than 8) values, which all live in one trailing key byte.
    // Only touch that byte when it exists: when out_size is a multiple of 8 (including zero)
    // the keys are already exhausted and reading another byte would run past the key span.
    std::size_t const remaining = out_size & 7;
    if (remaining != 0) {
        uint8_t const key_byte = *keys_ptr;
        for (std::size_t shift = 0; shift < remaining; shift++) {
            uint8_t const code = (key_byte >> shift) & 0x01;
            encoded_size += code + 1;
        }
    }

    return encoded_size == data_span.size();
}

}  // namespace svb16


================================================
FILE: c++/pod5_format/svb16/decode_scalar.hpp
================================================
#pragma once

#include "common.hpp"

#include <gsl/gsl-lite.hpp>

#include <cassert>
#include <cstddef>
#include <cstdint>
#include <cstring>

namespace svb16 {
namespace detail {
// Undoes zigzag encoding of a 16-bit value: the low bit carries the sign and
// the remaining bits carry the magnitude.
inline uint16_t zigzag_decode(uint16_t val)
{
    uint16_t const magnitude = static_cast<uint16_t>(val >> 1);
    // All ones when the low bit is set, all zeros otherwise.
    uint16_t const sign_mask = (val & 1) ? uint16_t{0xFFFF} : uint16_t{0};
    return static_cast<uint16_t>(magnitude ^ sign_mask);
}

// Reads one encoded value at `dataPtr` and advances `dataPtr` past it.
//
// `code` is the value's key bit: 0 means the value is stored in one byte,
// anything else means it is stored in two bytes.
inline uint16_t decode_data(gsl::span<uint8_t const>::iterator & dataPtr, uint8_t code)
{
    if (code == 0) {
        // Single-byte value: zero-extend it.
        uint16_t const narrow = (uint16_t)*dataPtr;
        dataPtr += 1;
        return narrow;
    }

    // Two-byte value, copied as stored (assumes little endian).
    uint16_t wide = 0;
    memcpy(&wide, dataPtr, 2);
    dataPtr += 2;
    return wide;
}
}  // namespace detail

// Portable decoder: expands `out_span.size()` values from the key and data
// streams into `out_span`.
//
// Each value consumes one key bit (taken least-significant bit first from each
// key byte) selecting a one- or two-byte encoding in `data_span`. When
// UseZigzag is set the value is zigzag-decoded; when UseDelta is set it is then
// added to the previous output value, starting from `prev`.
//
// Returns the position in `data_span` just past the last byte consumed.
template <typename Int16T, bool UseDelta, bool UseZigzag>
uint8_t const * decode_scalar(
    gsl::span<Int16T> out_span,
    gsl::span<uint8_t const> keys_span,
    gsl::span<uint8_t const> data_span,
    Int16T prev = 0)
{
    if (out_span.size() == 0) {
        return data_span.begin();
    }

    auto out = out_span.begin();
    auto const out_end = out_span.end();
    auto keys = keys_span.begin();
    auto data = data_span.begin();

    uint8_t shift = 0;  // cycles 0 through 7 then resets
    uint8_t key_byte = *keys++;
    // need to do the arithmetic in unsigned space so it wraps
    auto u_prev = static_cast<uint16_t>(prev);
    // Walk the output range directly rather than counting with a fixed-width
    // integer, so the loop is correct for any span size.
    for (; out != out_end; ++out, ++shift) {
        if (shift == 8) {
            shift = 0;
            key_byte = *keys++;
        }
        uint16_t value = detail::decode_data(data, (key_byte >> shift) & 0x01);
        SVB16_IF_CONSTEXPR(UseZigzag) { value = detail::zigzag_decode(value); }
        SVB16_IF_CONSTEXPR(UseDelta)
        {
            value += u_prev;
            u_prev = value;
        }
        *out = static_cast<Int16T>(value);
    }

    assert(keys == keys_span.end());
    assert(data <= data_span.end());
    return data;
}

}  // namespace svb16


================================================
FILE: c++/pod5_format/svb16/decode_x64.hpp
================================================
#pragma once

#include "common.hpp"
#include "decode_scalar.hpp"
#include "intrinsics.hpp"
#include "shuffle_tables.hpp"
#include "svb16.h"  // svb16_key_length

#include <gsl/gsl-lite.hpp>

#include <cstddef>
#include <cstdint>

#ifdef SVB16_X64

namespace svb16 {
namespace detail {
// Zigzag-decodes eight 16-bit lanes at once.
[[gnu::target("ssse3")]] inline __m128i zigzag_decode(__m128i val)
{
    // N >> 1
    __m128i const magnitude = _mm_srli_epi16(val, 1);
    // 0xFFFF if N & 1 else 0x0000: move the low bit to the top of the lane,
    // then smear it back down with an arithmetic shift.
    // alternative: _mm_sign_epi16(ones, _mm_slli_epi16(buf, 15))
    __m128i const sign_mask = _mm_srai_epi16(_mm_slli_epi16(val, 15), 15);
    return _mm_xor_si128(magnitude, sign_mask);
}

// Expands one group of eight encoded values into eight 16-bit lanes.
//
// `key` holds the eight key bits of the group and selects the row of
// g_decode_shuffle_table to shuffle with. `*data` is advanced by the number of
// bytes the group occupies (8 plus the number of set key bits).
//
// Note that 16 bytes are always loaded from `*data`, even though a group may
// occupy as few as 8, so the caller must make sure that many bytes are
// readable.
[[gnu::target("ssse3")]] inline __m128i unpack(uint32_t key, uint8_t const * SVB_RESTRICT * data)
{
    auto const len = static_cast<uint8_t>(8 + svb16_popcount(key));
    __m128i data_reg = _mm_loadu_si128(reinterpret_cast<__m128i const *>(*data));
    // The table is a plain byte array with no declared 16-byte alignment, so
    // load the row with an unaligned load rather than dereferencing it as an
    // aligned __m128i.
    __m128i const shuffle =
        _mm_loadu_si128(reinterpret_cast<__m128i const *>(&g_decode_shuffle_table[key]));

    data_reg = _mm_shuffle_epi8(data_reg, shuffle);
    *data += len;

    return data_reg;
}

// Finishes decoding eight 16-bit lanes and writes them (unaligned) to `to`.
//
// With UseZigzag the lanes are zigzag-decoded first. With UseDelta the lanes
// are turned into a running sum that continues from the last lane of `*prev`,
// and `*prev` is replaced by the stored result. Without UseDelta `*prev` is
// neither read nor written.
template <typename Int16T, bool UseDelta, bool UseZigzag>
[[gnu::target("ssse3")]] inline void store_8(Int16T * to, __m128i value, __m128i * prev)
{
    SVB16_IF_CONSTEXPR(UseZigzag) { value = zigzag_decode(value); }

    SVB16_IF_CONSTEXPR(UseDelta)
    {
        // Inclusive prefix sum over the eight lanes in three shift-and-add
        // steps (letters below denote sums of the original lanes).
        // value  == [A B C D E F G H]
        __m128i const pairs = _mm_add_epi16(value, _mm_slli_si128(value, 2));
        // pairs  == [A AB BC CD DE EF FG GH]
        __m128i const quads = _mm_add_epi16(pairs, _mm_slli_si128(pairs, 4));
        // quads  == [A AB ABC ABCD BCDE CDEF DEFG EFGH]
        __m128i const prefix = _mm_add_epi16(quads, _mm_slli_si128(quads, 8));
        // prefix == [A AB ABC ABCD ABCDE ABCDEF ABCDEFG ABCDEFGH]

        // Broadcast the last lane of the previous result into every lane.
        auto const broadcast_last_16 =
            m128i_from_bytes(14, 15, 14, 15, 14, 15, 14, 15, 14, 15, 14, 15, 14, 15, 14, 15);
        __m128i const carry = _mm_shuffle_epi8(*prev, broadcast_last_16);
        // carry  == [P P P P P P P P]

        value = _mm_add_epi16(prefix, carry);
        // value  == [PA PAB PABC PABCD PABCDE PABCDEF PABCDEFG PABCDEFGH]
        *prev = value;
    }

    _mm_storeu_si128(reinterpret_cast<__m128i *>(to), value);
}
}  // namespace detail

// SSE decoder: expands `out_span.size()` values from the key and data streams
// into `out_span`.
//
// Values are decoded 64 at a time (8 key bytes per step) with SIMD while at
// least 64 remain; the final `count & 63` values are handed to decode_scalar,
// whose return value is returned from here. `prev` seeds the delta decoding
// when UseDelta is set.
//
// The SIMD path issues 16-byte loads from the data stream even where fewer
// bytes are consumed, so the input needs readable bytes beyond the data (see
// the note on `decode_input_buffer_padding_byte_count` below).
template <typename Int16T, bool UseDelta, bool UseZigzag>
[[gnu::target("sse4.1")]] uint8_t const * decode_sse(
    gsl::span<Int16T> out_span,
    gsl::span<uint8_t const> keys_span,
    gsl::span<uint8_t const> data_span,
    Int16T prev = 0)
{
    // Local shorthand that fixes the template arguments of detail::store_8.
    auto store_8 = [](Int16T * to, __m128i value, __m128i * prev) {
        detail::store_8<Int16T, UseDelta, UseZigzag>(to, value, prev);
    };
    // this code treats all input as uint16_t (except the zigzag code, which treats it as int16_t)
    // this isn't a problem, as the scalar code does the same

    auto out = out_span.begin();
    auto const count = out_span.size();
    auto keys_it = keys_span.begin();
    auto data = data_span.begin();

    // handle blocks of 64 values (8 key bytes each)
    if (count >= 64) {
        size_t const key_bytes = count / 8;

        // Only initialised (and only used by store_8) when UseDelta is set.
        __m128i prev_reg;
        SVB16_IF_CONSTEXPR(UseDelta) { prev_reg = _mm_set1_epi16(prev); }

        // `offset` counts up from -(number of 64-value blocks - 1) to 0, and
        // `keyPtr64` is biased so that `keyPtr64 + offset` addresses the keys
        // of the current block. The loop below therefore handles every block
        // except the last, which is decoded separately afterwards.
        int64_t offset = -static_cast<int64_t>(key_bytes) / 8 + 1;  // 8 -> 4?
        uint64_t const * keyPtr64 = reinterpret_cast<uint64_t const *>(keys_it) - offset;
        uint64_t nextkeys;
        memcpy(&nextkeys, keyPtr64 + offset, sizeof(nextkeys));

        __m128i data_reg;

        for (; offset != 0; ++offset) {
            uint64_t keys = nextkeys;
            // Fetch the following block's keys ahead of use.
            memcpy(&nextkeys, keyPtr64 + offset + 1, sizeof(nextkeys));
            // faster 16-bit delta since we only have 8-bit values
            if (!keys) {  // 64 1-byte ints in a row

                // _mm_cvtepu8_epi16: SSE4.1
                // Each step loads 16 bytes but only widens the low 8.
                data_reg =
                    _mm_cvtepu8_epi16(_mm_lddqu_si128(reinterpret_cast<__m128i const *>(data)));
                store_8(out, data_reg, &prev_reg);
                data_reg =
                    _mm_cvtepu8_epi16(_mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 8)));
                store_8(out + 8, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 16)));
                store_8(out + 16, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 24)));
                store_8(out + 24, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 32)));
                store_8(out + 32, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + +40)));
                store_8(out + 40, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 48)));
                store_8(out + 48, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 56)));
                store_8(out + 56, data_reg, &prev_reg);
                out += 64;
                data += 64;
                continue;
            }

            // General case: one key byte (8 values) per unpack call, which
            // also advances `data` by the bytes that group occupies.
            data_reg = detail::unpack(keys & 0x00FF, &data);
            store_8(out, data_reg, &prev_reg);
            data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
            store_8(out + 8, data_reg, &prev_reg);

            keys >>= 16;
            data_reg = detail::unpack((keys & 0x00FF), &data);
            store_8(out + 16, data_reg, &prev_reg);
            data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
            store_8(out + 24, data_reg, &prev_reg);

            keys >>= 16;
            data_reg = detail::unpack((keys & 0x00FF), &data);
            store_8(out + 32, data_reg, &prev_reg);
            data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
            store_8(out + 40, data_reg, &prev_reg);

            keys >>= 16;
            data_reg = detail::unpack((keys & 0x00FF), &data);
            store_8(out + 48, data_reg, &prev_reg);

            // Note we load at least sizeof(__m128i) bytes from the end of data
            // here, need to ensure that is available to read.
            //
            // But we might not use it all depending on the unpacking.
            //
            // This is ok due to `decode_input_buffer_padding_byte_count` ensuring
            // extra space on the input buffer.
            data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
            store_8(out + 56, data_reg, &prev_reg);

            out += 64;
        }
        // Last 64-value block: same decoding as above, but no further keys are
        // fetched and the all-one-byte path narrows its final load.
        {
            uint64_t keys = nextkeys;
            // faster 16-bit delta since we only have 8-bit values
            if (!keys) {  // 64 1-byte ints in a row
                data_reg =
                    _mm_cvtepu8_epi16(_mm_lddqu_si128(reinterpret_cast<__m128i const *>(data)));
                store_8(out, data_reg, &prev_reg);
                data_reg =
                    _mm_cvtepu8_epi16(_mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 8)));
                store_8(out + 8, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 16)));
                store_8(out + 16, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 24)));
                store_8(out + 24, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 32)));
                store_8(out + 32, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + +40)));
                store_8(out + 40, data_reg, &prev_reg);
                data_reg = _mm_cvtepu8_epi16(
                    _mm_lddqu_si128(reinterpret_cast<__m128i const *>(data + 48)));
                store_8(out + 48, data_reg, &prev_reg);
                // Only load the first 8 bytes here, otherwise we may run off the end of the buffer
                data_reg = _mm_cvtepu8_epi16(
                    _mm_loadl_epi64(reinterpret_cast<__m128i const *>(data + 56)));
                store_8(out + 56, data_reg, &prev_reg);
                out += 64;
                data += 64;

            } else {
                data_reg = detail::unpack(keys & 0x00FF, &data);
                store_8(out, data_reg, &prev_reg);
                data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
                store_8(out + 8, data_reg, &prev_reg);

                keys >>= 16;
                data_reg = detail::unpack((keys & 0x00FF), &data);
                store_8(out + 16, data_reg, &prev_reg);
                data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
                store_8(out + 24, data_reg, &prev_reg);

                keys >>= 16;
                data_reg = detail::unpack((keys & 0x00FF), &data);
                store_8(out + 32, data_reg, &prev_reg);
                data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
                store_8(out + 40, data_reg, &prev_reg);

                keys >>= 16;
                data_reg = detail::unpack((keys & 0x00FF), &data);
                store_8(out + 48, data_reg, &prev_reg);
                data_reg = detail::unpack((keys & 0xFF00) >> 8, &data);
                store_8(out + 56, data_reg, &prev_reg);

                out += 64;
            }
        }
        // Carry the last decoded value into the scalar tail as its `prev`.
        prev = out[-1];

        // Skip the key bytes consumed above (key_bytes rounded down to a
        // multiple of 8).
        keys_it += key_bytes - (key_bytes & 7);
    }

    assert(out <= out_span.end());
    assert(keys_it <= keys_span.end());
    assert(data <= data_span.end());

    // Whatever is left (fewer than 64 values) goes through the scalar decoder.
    auto out_scalar_span = gsl::make_span(out, out_span.end());
    assert(out_scalar_span.size() == (count & 63));

    auto keys_scalar_span = gsl::make_span(keys_it, keys_span.end());
    auto data_scalar_span = gsl::make_span(data, data_span.end());

    return decode_scalar<Int16T, UseDelta, UseZigzag>(
        out_scalar_span, keys_scalar_span, data_scalar_span, prev);
}

#endif  // SVB16_X64

}  // namespace svb16


================================================
FILE: c++/pod5_format/svb16/encode.hpp
================================================
#pragma once

#include "common.hpp"
#include "encode_scalar.hpp"
#include "svb16.h"  // svb16_key_length
#ifdef SVB16_X64
#include "encode_x64.hpp"
#include "simd_detect_x64.hpp"
#endif

namespace svb16 {

// Encodes `count` values from `in` into `out` and returns the number of bytes
// written, measured from `out`.
//
// The output starts with svb16_key_length(count) key bytes, followed directly
// by the data bytes. On x64 builds the SSE encoder is used when has_ssse3()
// reports support; otherwise the scalar encoder runs.
template <typename Int16T, bool UseDelta, bool UseZigzag>
size_t encode(Int16T const * in, uint8_t * SVB_RESTRICT out, uint32_t count, Int16T prev = 0)
{
    uint8_t * const key_bytes = out;
    uint8_t * const data_bytes = key_bytes + ::svb16_key_length(count);

    uint8_t const * encoded_end = nullptr;
#ifdef SVB16_X64
    if (has_ssse3()) {
        encoded_end =
            encode_sse<Int16T, UseDelta, UseZigzag>(in, key_bytes, data_bytes, count, prev);
    } else
#endif
    {
        encoded_end =
            encode_scalar<Int16T, UseDelta, UseZigzag>(in, key_bytes, data_bytes, count, prev);
    }
    return encoded_end - out;
}

}  // namespace svb16


================================================
FILE: c++/pod5_format/svb16/encode_scalar.hpp
================================================
#pragma once

#include "common.hpp"

#include <cstddef>
#include <cstdint>
#include <cstring>

namespace svb16 {
namespace detail {
// Zigzag-encodes a 16-bit value (interpreted as signed): the value is doubled
// and, when it is negative, every bit of the result is flipped.
inline uint16_t zigzag_encode(uint16_t val)
{
    uint16_t const doubled = static_cast<uint16_t>(val << 1);
    // All ones when the sign bit is set, all zeros otherwise.
    uint16_t const sign_mask = (val & 0x8000) ? uint16_t{0xFFFF} : uint16_t{0};
    return static_cast<uint16_t>(doubled ^ sign_mask);
}
}  // namespace detail

// Portable encoder: writes `count` values from `in` as key bits at `keys` and
// variable-length data at `data`.
//
// With UseDelta each value is first replaced by its difference from the
// previous input value (starting from `prev`); with UseZigzag the result is
// then zigzag-encoded. A value below 256 is stored in one byte with a 0 key
// bit, anything else in two bytes with a 1 key bit. Key bits are packed
// least-significant bit first, eight per key byte.
//
// Returns the position just past the last data byte written. Nothing is
// written when `count` is 0.
template <typename Int16T, bool UseDelta, bool UseZigzag>
uint8_t * encode_scalar(
    Int16T const * in,
    uint8_t * SVB_RESTRICT keys,
    uint8_t * SVB_RESTRICT data,
    uint32_t count,
    Int16T prev = 0)
{
    if (count == 0) {
        return data;
    }

    uint8_t pending_key = 0;
    uint8_t bit_index = 0;  // cycles 0 through 7 then resets
    Int16T const * const in_end = in + count;
    for (Int16T const * cursor = in; cursor != in_end; ++cursor) {
        // Flush the key byte once all eight of its bits have been decided.
        if (bit_index == 8) {
            *keys++ = pending_key;
            pending_key = 0;
            bit_index = 0;
        }

        uint16_t encoded = static_cast<uint16_t>(*cursor);
        SVB16_IF_CONSTEXPR(UseDelta)
        {
            // need to do the arithmetic in unsigned space so it wraps
            encoded = static_cast<uint16_t>(encoded - static_cast<uint16_t>(prev));
            prev = *cursor;
        }
        SVB16_IF_CONSTEXPR(UseZigzag) { encoded = detail::zigzag_encode(encoded); }

        if ((encoded >> 8) == 0) {
            // Fits in one byte; the key bit stays 0.
            *data++ = static_cast<uint8_t>(encoded);
        } else {
            // Needs two bytes (assumes little endian); mark it in the key.
            std::memcpy(data, &encoded, 2);
            data += 2;
            pending_key |= 1 << bit_index;
        }

        ++bit_index;
    }

    *keys = pending_key;  // write last key (no increment needed)
    return data;
}

}  // namespace svb16


================================================
FILE: c++/pod5_format/svb16/encode_x64.hpp
================================================
#pragma once

#include "common.hpp"
#include "encode_scalar.hpp"
#include "intrinsics.hpp"
#include "shuffle_tables.hpp"
#include "svb16.h"  // svb16_key_length

#include <cstddef>
#include <cstdint>

#ifdef SVB16_X64

namespace svb16 {
namespace detail {
// Per-lane difference between each 16-bit value and its predecessor, where the
// predecessor of lane 0 of `curr` is the last lane of `prev`.
[[gnu::target("ssse3")]] inline __m128i delta(__m128i curr, __m128i prev)
{
    // [prev[7], curr[0], curr[1], ..., curr[6]]
    __m128i const predecessors = _mm_alignr_epi8(curr, prev, 14);
    return _mm_sub_epi16(curr, predecessors);
}

// Zigzag-encodes eight 16-bit lanes at once.
[[gnu::target("ssse3")]] inline __m128i zigzag_encode(__m128i val)
{
    // Each lane doubled (wrapping within 16 bits).
    __m128i const doubled = _mm_slli_epi16(val, 1);
    // Each lane filled with copies of its sign bit.
    __m128i const sign_mask = _mm_srai_epi16(val, 16);
    return _mm_xor_si128(doubled, sign_mask);
}

// Loads eight 16-bit values (unaligned) from `from` and applies the selected
// transforms.
//
// With UseDelta the values are differenced against their predecessors and
// `*prev` is replaced by the raw loaded values; with UseZigzag the result is
// zigzag-encoded. Without UseDelta `*prev` is left untouched.
template <typename Int16T, bool UseDelta, bool UseZigzag>
[[gnu::target("ssse3")]] inline __m128i load_8(Int16T const * from, __m128i * prev)
{
    __m128i lanes = _mm_loadu_si128(reinterpret_cast<__m128i const *>(from));

    SVB16_IF_CONSTEXPR(UseDelta)
    {
        __m128i const raw = lanes;
        lanes = delta(raw, *prev);
        *prev = raw;
    }

    SVB16_IF_CONSTEXPR(UseZigzag) { lanes = zigzag_encode(lanes); }

    return lanes;
}
}  // namespace detail

// SSE encoder: writes `count` values from `in` as key bits at `keys_dest` and
// variable-length data at `data_dest`.
//
// Values are processed 16 at a time (two key bytes per step); the remaining
// `count & 15` values are handed to encode_scalar, whose return value is
// returned from here. `prev` seeds the delta encoding when UseDelta is set.
//
// Each group of eight values is stored with a full 16-byte write while
// `data_dest` only advances by 8 plus the number of two-byte values, so the
// destination must have room for the bytes written beyond that point.
template <typename Int16T, bool UseDelta, bool UseZigzag>
[[gnu::target("ssse3")]] uint8_t * encode_sse(
    Int16T const * in,
    uint8_t * SVB_RESTRICT keys_dest,
    uint8_t * SVB_RESTRICT data_dest,
    uint32_t count,
    Int16T prev = 0)
{
    // this code treats all input as uint16_t (except the zigzag code, which treats it as int16_t)
    // this isn't a problem, as the scalar code does the same
    __m128i prev_reg;
    SVB16_IF_CONSTEXPR(UseDelta) { prev_reg = _mm_set1_epi16(prev); }
    auto const mask_01 = detail::m128i_from_bytes(
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01,
        0x01);
    for (Int16T const * end = &in [(count & ~15)]; in != end; in += 16) {
        // load up 16 values into r0 and r1
        auto r0 = detail::load_8<Int16T, UseDelta, UseZigzag>(in, &prev_reg);
        auto r1 = detail::load_8<Int16T, UseDelta, UseZigzag>(in + 8, &prev_reg);

        // 1 byte per input byte: 1 if the byte is non-zero, 0 if not
        auto r2 = _mm_min_epu8(mask_01, r0);
        auto r3 = _mm_min_epu8(mask_01, r1);
        // 1 byte per input Int16T: FF if the MSB is set, 00 or 01 if not
        // (us = unsigned saturation)
        r2 = _mm_packus_epi16(r2, r3);
        // 1 bit per input Int16T: 1 if the MSB is set, 0 if not
        // only the low 16 bits are set
        auto const keys = static_cast<uint16_t>(_mm_movemask_epi8(r2));

        // use the shuffle table to discard the MSB if the corresponding key bit is not set
        // (rows are 16 bytes and are indexed by the low 7 key bits of each group of 8)
        r2 = _mm_loadu_si128(
            reinterpret_cast<__m128i const *>(&g_encode_shuffle_table[(keys << 4) & 0x07F0]));
        r3 = _mm_loadu_si128(
            reinterpret_cast<__m128i const *>(&g_encode_shuffle_table[(keys >> 4) & 0x07F0]));
        r0 = _mm_shuffle_epi8(r0, r2);
        r1 = _mm_shuffle_epi8(r1, r3);

        // store the data to data_dest (note that we often end up with overlapping writes)
        _mm_storeu_si128(reinterpret_cast<__m128i *>(data_dest), r0);
        data_dest += 8 + svb16_popcount(keys & 0xFF);
        _mm_storeu_si128(reinterpret_cast<__m128i *>(data_dest), r1);
        data_dest += 8 + svb16_popcount(keys >> 8);

        // keys_dest is a byte pointer with no alignment guarantee, so copy the
        // two key bytes rather than storing through a uint16_t pointer.
        std::memcpy(keys_dest, &keys, sizeof(keys));
        keys_dest += 2;
    }

    // The scalar tail continues the delta chain from the last value encoded
    // above (or from the caller's `prev` if the loop did not run).
    SVB16_IF_CONSTEXPR(UseDelta) { prev = _mm_extract_epi16(prev_reg, 7); }
    // max two control bytes (16 values) left, use the scalar function
    count &= 15;
    return encode_scalar<Int16T, UseDelta, UseZigzag>(in, keys_dest, data_dest, count, prev);
}

#endif  // SVB16_X64

}  // namespace svb16


================================================
FILE: c++/pod5_format/svb16/generate_shuffle_tables.py
================================================
def encode_table_row(control):
    """Build one 16-entry encode shuffle row for a 7-bit control value.

    For each of the first seven 16-bit values the low byte index is always
    emitted and the high byte index only when the matching bit of ``control``
    is set. Both byte indices of the eighth value are always emitted. The row
    is padded to 16 entries with 0xFF.
    """
    row = []
    for index in range(7):
        low_byte = 2 * index
        row.append(low_byte)
        if control & (1 << index):
            row.append(low_byte + 1)
    # The eighth value always keeps both of its bytes.
    row.extend([14, 15])
    row.extend([0xFF] * (16 - len(row)))
    return row


def decode_table_row(control):
    """Build one 16-entry decode shuffle row for an 8-bit control value.

    Each of the eight output values takes two entries: the index of its first
    source byte, then either the index of the following source byte (when the
    matching bit of ``control`` is set) or 0xFF.
    """
    row = []
    source = 0
    for bit in range(8):
        two_bytes = (control >> bit) & 1
        row.append(source)
        row.append(source + 1 if two_bytes else 0xFF)
        source += 1 + two_bytes
    return row


def print_x64_encode_table():
    """Print the C++ definition of the flat 128-row encode shuffle table."""
    print("static constexpr uint8_t g_encode_shuffle_table[128*16] = {")
    for control in range(128):
        cells = ", ".join(
            "0x{:02X}".format(value) for value in encode_table_row(control)
        )
        print("\t" + cells + ",")
    print("};\n\n")


def print_x64_decode_table():
    """Print the C++ definition of the 256-row decode shuffle table."""
    print("static const uint8_t g_decode_shuffle_table[256][16] = {")
    for control in range(256):
        cells = ", ".join(
            "0x{:02X}".format(value) for value in decode_table_row(control)
        )
        print("\t{ " + cells + "},")
    print("};\n\n")


if __name__ == "__main__":
    # Header preamble, then both tables inside the x64 guard.
    for preamble_line in (
        "#pragma once",
        '#include "common.hpp" // arch macros',
        "#include <cstdint>",
        "",
        "#ifdef SVB16_X64",
    ):
        print(preamble_line)
    print_x64_encode_table()
    print_x64_decode_table()
    print("#endif")


================================================
FILE: c++/pod5_format/svb16/intrinsics.hpp
================================================
#pragma once

#include "common.hpp"  // architecture macros

#if defined(_MSC_VER)
#include <intrin.h>
#elif defined(__GNUC__) && defined(SVB16_X64)
#include <x86intrin.h>
#elif defined(__GNUC__) && defined(__ARM_NEON__)
#include <arm_neon.h>
#endif

#include <cstdint>

namespace svb16 { namespace detail {
// Builds a 128-bit integer vector from sixteen bytes, usable in constant
// expressions. `a` becomes byte 0 (the least significant byte of the low
// 64-bit half) and `p` becomes byte 15.
[[gnu::target("sse2")]] inline constexpr __m128i m128i_from_bytes(
    uint8_t a,
    uint8_t b,
    uint8_t c,
    uint8_t d,
    uint8_t e,
    uint8_t f,
    uint8_t g,
    uint8_t h,
    uint8_t i,
    uint8_t j,
    uint8_t k,
    uint8_t l,
    uint8_t m,
    uint8_t n,
    uint8_t o,
    uint8_t p)
{
#ifdef _MSC_VER
    // This branch initialises the vector byte by byte.
    return __m128i{
        (char)a,
        (char)b,
        (char)c,
        (char)d,
        (char)e,
        (char)f,
        (char)g,
        (char)h,
        (char)i,
        (char)j,
        (char)k,
        (char)l,
        (char)m,
        (char)n,
        (char)o,
        (char)p};
#else
    // This branch initialises the vector from two 64-bit halves: bytes a..h
    // form the low half and bytes i..p the high half. The top byte of each
    // half is shifted as unsigned so that a value >= 0x80 does not overflow a
    // signed shift.
    return __m128i{
        static_cast<int64_t>(static_cast<uint64_t>(h) << 56) + (static_cast<int64_t>(g) << 48)
            + (static_cast<int64_t>(f) << 40) + (static_cast<int64_t>(e) << 32)
            + (static_cast<int64_t>(d) << 24) + (static_cast<int64_t>(c) << 16)
            + (static_cast<int64_t>(b) << 8) + static_cast<int64_t>(a),
        static_cast<int64_t>(static_cast<uint64_t>(p) << 56) + (static_cast<int64_t>(o) << 48)
            + (static_cast<int64_t>(n) << 40) + (static_cast<int64_t>(m) << 32)
            + (static_cast<int64_t>(l) << 24) + (static_cast<int64_t>(k) << 16)
            + (static_cast<int64_t>(j) << 8) + static_cast<int64_t>(i)};
#endif
}
}}  // namespace svb16::detail


================================================
FILE: c++/pod5_format/svb16/shuffle_tables.hpp
================================================
#pragma once
#include "common.hpp"  // arch macros

#include <cstdint>

#ifdef SVB16_X64
static constexpr uint8_t g_encode_shuffle_table[128 * 16] = {
    0x00, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0E, 0x0F, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF,
    0x00, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF,
    0x00, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, 0xFF,
    0x00, 0x01, 0x02, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF,
    0x00, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF,
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F,
};

static uint8_t const g_decode_shuffle_table[256][16] = {
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF,
     0x0D,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C,
     0x0D,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0xFF},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0x0E,
     0xFF},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0xFF,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0xFF,
     0x0C,
     0x0D},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0xFF,
     0x0D,
     0x0E},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0xFF,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0xFF,
     0x0B,
     0x0C,
     0x0D,
     0x0E},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0xFF,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0xFF,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0x0E},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0xFF,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0xFF,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0x0E},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0xFF,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0xFF,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0x0E},
    {0x00,
     0xFF,
     0x01,
     0xFF,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D},
    {0x00,
     0x01,
     0x02,
     0xFF,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0x0E},
    {0x00,
     0xFF,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0x0E},
    {0x00,
     0x01,
     0x02,
     0x03,
     0x04,
     0x05,
     0x06,
     0x07,
     0x08,
     0x09,
     0x0A,
     0x0B,
     0x0C,
     0x0D,
     0x0E,
     0x0F},
};

#endif


================================================
FILE: c++/pod5_format/svb16/simd_detect_x64.hpp
================================================
#pragma once

#include "common.hpp"  // architecture macros

#if defined(SVB16_X64)

#ifdef _MSC_VER
#include <intrin.h>
#endif

// __AVX__ is documented for MSVC, but __SSE4_1__ isn't
#if defined(__AVX__) || defined(__SSE4_1__)

/// Compile-time answer used when __AVX__ or __SSE4_1__ is defined:
/// SSSE3 is reported as available without any runtime probe.
inline constexpr bool has_ssse3()
{
    return true;
}

/// Compile-time answer used when __AVX__ or __SSE4_1__ is defined:
/// SSE4.1 is reported as available without any runtime probe.
inline constexpr bool has_sse4_1()
{
    return true;
}

#else

/// The four register values produced by one CPUID query (see cpuid()).
/// Field order matters: cpuid() fills this struct positionally on MSVC.
struct CpuidResult {
    unsigned int eax;  // value returned in EAX
    unsigned int ebx;  // value returned in EBX
    unsigned int ecx;  // value returned in ECX
    unsigned int edx;  // value returned in EDX
};

/// Execute the CPUID instruction for the given leaf / subleaf.
///
/// \param leaf     Value placed in EAX before the instruction runs.
/// \param subleaf  Value placed in ECX before the instruction runs.
/// \return The EAX/EBX/ECX/EDX values reported by the instruction.
inline CpuidResult cpuid(unsigned int leaf, unsigned int subleaf)
{
#ifdef _MSC_VER
    // MSVC has no inline asm on x64; use the compiler intrinsic, which fills
    // info[0..3] with EAX, EBX, ECX, EDX in that order.
    int info[4];
    __cpuidex(info, static_cast<int>(leaf), static_cast<int>(subleaf));
    return CpuidResult{
        static_cast<unsigned int>(info[0]),
        static_cast<unsigned int>(info[1]),
        static_cast<unsigned int>(info[2]),
        static_cast<unsigned int>(info[3]),
    };
#else
    CpuidResult info;
    // Outputs: operand 0 = EAX, 1 = EBX, 2 = ECX, 3 = EDX.
    // Inputs use matching constraints: "0" puts leaf in EAX, "2" puts subleaf in ECX.
    asm("cpuid\n\t"
        : "=a"(info.eax), "=b"(info.ebx), "=c"(info.ecx), "=d"(info.edx)
        : "0"(leaf), "2"(subleaf));
    return info;
#endif
}

/// ECX value of CPUID leaf 1 (subleaf 0), queried once and then reused.
inline unsigned int cpuid_leaf1_ecx()
{
    // Function-local static: initialised on first call only (thread-safe since C++11).
    static unsigned int const cached_leaf1_ecx = cpuid(1, 0).ecx;
    return cached_leaf1_ecx;
}

#if defined(__SSSE3__)
/// The build already targets SSSE3, so no runtime probe is required.
inline constexpr bool has_ssse3()
{
    return true;
}
#else
/// Runtime probe: tests bit 9 of the ECX value reported by CPUID leaf 1.
inline bool has_ssse3()
{
    unsigned int const feature_bit = 1u << 9;
    return (cpuid_leaf1_ecx() & feature_bit) != 0;
}
#endif

/// Runtime probe: tests bit 19 of the ECX value reported by CPUID leaf 1.
inline bool has_sse4_1()
{
    unsigned int const feature_bit = 1u << 19;
    return (cpuid_leaf1_ecx() & feature_bit) != 0;
}

#endif  // defined(__AVX__) || defined(__SSE4_1__)
#endif  // defined(SVB16_X64)


================================================
FILE: c++/pod5_format/svb16/streamvbytedelta_decode_16.c
================================================
#include "streamvbyte_isadetection.h"
#include "streamvbytedelta.h"

#include <string.h>  // for memcpy

// Undo zigzag encoding of a 16-bit value: even inputs map to val / 2,
// odd inputs map to the bitwise complement of val / 2.
static inline uint16_t zigzag_decode_16(uint16_t val)
{
    uint16_t const magnitude = (uint16_t)(val >> 1);
    // All ones when the low bit is set, all zeros otherwise.
    uint16_t const sign_mask = (val & 1) ? (uint16_t)0xFFFF : (uint16_t)0x0000;
    return (uint16_t)(magnitude ^ sign_mask);
}

// Read one encoded value from the data stream and advance the caller's cursor.
//   dataPtrPtr: in/out pointer to the current read position.
//   code:       0 means the value occupies 1 byte, anything else means 2 bytes.
// Returns the raw (still zigzag-encoded) value.
static inline uint16_t _decode_data(uint8_t const ** dataPtrPtr, uint8_t code)
{
    uint8_t const * const src = *dataPtrPtr;
    uint16_t val = 0;

    if (code != 0) {
        // 2-byte value, copied verbatim (assumes little endian)
        memcpy(&val, src, 2);
        *dataPtrPtr = src + 2;
        return val;
    }

    // 1-byte value
    val = (uint16_t)src[0];
    *dataPtrPtr = src + 1;
    return val;
}

// Scalar decoder: reads `count` zigzag-encoded deltas and writes the running
// sum (starting from `prev`) to outPtr.
//   keyPtr:  key stream, 1 bit per value (0 = 1 data byte, 1 = 2 data bytes),
//            least-significant bit first.
//   dataPtr: data stream.
// Returns a pointer to the first data byte that was not consumed.
// When count is 0 nothing is read or written.
static uint8_t const * svb_decode_scalar_d1_init(
    uint16_t * outPtr,
    uint8_t const * keyPtr,
    uint8_t const * dataPtr,
    uint32_t count,
    uint16_t prev)
{
    uint16_t key = 0;

    for (uint32_t idx = 0; idx < count; ++idx) {
        uint32_t const bit = idx & 7u;
        if (bit == 0) {
            // a fresh key byte is needed for every group of 8 values
            key = *keyPtr++;
        }

        uint8_t const code = (uint8_t)((key >> bit) & 0x1);
        uint16_t const delta = zigzag_decode_16(_decode_data(&dataPtr, code));

        prev = (uint16_t)(prev + delta);
        *outPtr++ = prev;
    }

    return dataPtr;
}

#ifdef STREAMVBYTE_X64
#include "streamvbytedelta_x64_decode_16.c"
#endif

// Decode `count` 16-bit values from `in` (key bytes followed by data bytes)
// into `out`, using `prev` as the value preceding the first element.
// Returns the number of input bytes consumed.
size_t streamvbyte_zigzag_delta_decode_16(
    uint8_t const * in,
    uint16_t * out,
    uint32_t count,
    uint16_t prev)
{
    // One key bit per value: ceil(count / 8) key bytes, computed without overflow.
    uint32_t const keyBytes = (count / 8) + ((count % 8) != 0 ? 1u : 0u);
    uint8_t const * const keys = in;
    uint8_t const * const data = in + keyBytes;  // data follows the keys
    uint8_t const * consumedEnd;

#ifdef STREAMVBYTE_X64
    if (streamvbyte_ssse3()) {
        consumedEnd = svb_decode_avx_d1_init(out, keys, data, count, prev);
        return consumedEnd - in;
    }
#endif

    consumedEnd = svb_decode_scalar_d1_init(out, keys, data, count, prev);
    return consumedEnd - in;
}


================================================
FILE: c++/pod5_format/svb16/streamvbytedelta_encode_16.c
================================================
#include "streamvbyte_isadetection.h"
#include "streamvbytedelta.h"

#include <stdio.h>
#include <string.h>  // for memcpy

#ifdef STREAMVBYTE_X64
#include "streamvbytedelta_x64_encode_16.c"
#endif

// Zigzag-encode a 16-bit two's-complement value: the doubled value is
// complemented when the sign bit (bit 15) of val is set.
static inline uint16_t _zigzag_encode_16(uint16_t val)
{
    uint16_t const doubled = (uint16_t)(val << 1);
    uint16_t const sign_mask = (val & 0x8000u) ? (uint16_t)0xFFFF : (uint16_t)0x0000;
    return (uint16_t)(doubled ^ sign_mask);
}

// Append one value to the data stream and advance the caller's write cursor.
// Values below 256 take 1 byte, all others take 2 bytes.
// Returns the key code for the value: 0 for 1 byte, 1 for 2 bytes.
static uint8_t _encode_data(uint16_t val, uint8_t * __restrict__ * dataPtrPtr)
{
    uint8_t * const dst = *dataPtrPtr;

    if (val > 0xFF) {
        // 2 bytes, copied verbatim (assumes little endian)
        memcpy(dst, &val, 2);
        *dataPtrPtr += 2;
        return 1;
    }

    // 1 byte
    dst[0] = (uint8_t)val;
    *dataPtrPtr += 1;
    return 0;
}

// Scalar encoder: writes the zigzag-encoded delta of each input value against
// its predecessor (the first against `prev`).
//   keyPtr:  receives 1 key bit per value, least-significant bit first.
//   dataPtr: receives 1 or 2 data bytes per value.
// Returns a pointer to the first unused data byte.
// When count is 0 nothing is read or written.
static uint8_t * svb_encode_scalar_d1_init(
    uint16_t const * in,
    uint8_t * __restrict__ keyPtr,
    uint8_t * __restrict__ dataPtr,
    uint32_t count,
    uint16_t prev)
{
    if (count == 0) {
        return dataPtr;
    }

    uint8_t pendingKey = 0;  // key byte currently being filled
    for (uint32_t idx = 0; idx < count; ++idx) {
        uint32_t const bit = idx & 7u;
        if (idx != 0 && bit == 0) {
            // the previous key byte is complete: flush it and start a new one
            *keyPtr++ = pendingKey;
            pendingKey = 0;
        }

        uint16_t const encoded = _zigzag_encode_16((uint16_t)(in[idx] - prev));
        prev = in[idx];

        uint8_t const code = _encode_data(encoded, &dataPtr);
        pendingKey |= code << bit;
    }

    // the last (possibly partial) key byte is always written
    *keyPtr = pendingKey;
    return dataPtr;
}

// Encode `count` 16-bit values from `in` into `out` (key bytes followed by
// data bytes), using `prev` as the value preceding the first element.
// Returns the number of bytes written to `out`.
size_t streamvbyte_zigzag_delta_encode_16(
    uint16_t const * in,
    uint32_t count,
    uint8_t * out,
    uint16_t prev)
{
#ifdef STREAMVBYTE_X64
    if (streamvbyte_ssse3()) {
        return streamvbyte_zigzag_delta_encode_SSSE3_d1_init(in, count, out, prev);
    }
#endif
    // One key bit per value: ceil(count / 8) key bytes, computed without overflow.
    uint32_t const keyBytes = (count / 8) + ((count % 8) != 0 ? 1u : 0u);
    uint8_t * const keys = out;             // keys come first
    uint8_t * const data = out + keyBytes;  // variable-length data follows
    uint8_t * const dataEnd = svb_encode_scalar_d1_init(in, keys, data, count, prev);
    return dataEnd - out;
}


================================================
FILE: c++/pod5_format/svb16/streamvbytedelta_x64_decode_16.c
================================================
#include "streamvbyte_isadetection.h"
#include "streamvbyte_shuffle_tables_decode_16.h"

#include <string.h>  // for memcpy
#ifdef STREAMVBYTE_X64

STREAMVBYTE_TARGET_SSSE3
// Zigzag-decode eight 16-bit lanes at once: (N >> 1) ^ (0xFFFF if N & 1 else 0).
static __m128i undo_zigzag_16(__m128i buf)
{
    // N >> 1 in every lane
    __m128i const magnitude = _mm_srli_epi16(buf, 1);
    // Move bit 0 into the sign position, then smear it across the lane.
    __m128i const lowBitAsSign = _mm_slli_epi16(buf, 15);
    __m128i const signMask = _mm_srai_epi16(lowBitAsSign, 15);
    return _mm_xor_si128(magnitude, signMask);
}

STREAMVBYTE_UNTARGET_REGION

STREAMVBYTE_TARGET_SSSE3
static inline __m128i _decode_avx(uint32_t key, uint8_t const * __restrict__ * dataPtrPtr)
{
    uint8_t len = 8 + popcount(key);
    __m128i Data = _mm_loadu_si128((__m128i *)*dataPtrPtr);
    __m128i Shuf = *(__m128i *)&shuffleTable[key];

    Data = _mm_shuffle_epi8(Data, Shuf);
    *dataPtrPtr += len;

    return Data;
}

STREAMVBYTE_UNTARGET_REGION

STREAMVBYTE_TARGET_SSSE3
// Store all 16 bytes of Vec at `out`; no alignment is required.
static inline void _write_avx(uint16_t * out, __m128i Vec)
{
    __m128i * const dst = (__m128i *)out;
    _mm_storeu_si128(dst, Vec);
}

STREAMVBYTE_UNTARGET_REGION

STREAMVBYTE_TARGET_SSSE3
// Zigzag-decode eight 16-bit deltas, turn them into running sums seeded with
// the last lane of Prev, store the result at `out` and return it (so it can
// be passed as Prev for the next group).
static inline __m128i _write_16bit_avx_d1(uint16_t * out, __m128i Vec, __m128i Prev)
{
    // Shuffle mask that copies bytes 14..15 (the last 16-bit lane) into every lane.
#ifndef _MSC_VER
    __m128i LastLaneMask = {0x0F0E0F0E0F0E0F0E, 0x0F0E0F0E0F0E0F0E};
#else
    __m128i LastLaneMask = {14, 15, 14, 15, 14, 15, 14, 15, 14, 15, 14, 15, 14, 15, 14, 15};
#endif
    __m128i const Carry = _mm_shuffle_epi8(Prev, LastLaneMask);  // [P P P P P P P P]

    // Sum == [A B C D E F G H] (16 bit values)
    __m128i Sum = undo_zigzag_16(Vec);
    // + [- A B C D E F G]     -> [A AB BC CD DE EF FG GH]
    Sum = _mm_add_epi16(Sum, _mm_slli_si128(Sum, 2));
    // + [- - A AB BC CD DE EF] -> [A AB ABC ABCD BCDE CDEF DEFG EFGH]
    Sum = _mm_add_epi16(Sum, _mm_slli_si128(Sum, 4));
    // + [- - - - A AB ABC ABCD] -> [A AB ABC ABCD ABCDE ABCDEF ABCDEFG ABCDEFGH]
    Sum = _mm_add_epi16(Sum, _mm_slli_si128(Sum, 8));
    // add the carried-in previous value to every prefix sum
    Sum = _mm_add_epi16(Sum, Carry);

    _write_avx(out, Sum);
    return Sum;
}

STREAMVBYTE_UNTARGET_REGION

STREAMVBYTE_TARGET_SSSE3
static uint8_t const * svb_decode_avx_d1_init(
    uint16_t * out,
    uint8_t const * __restrict__ keyPtr,
    uint8_t const * __restrict__ dataPtr,
    uint64_t count,
    uint16_t prev)
{
    uint64_t keybytes = count / 4;  // number of key bytes
    if (keybytes >= 8) {
        __m128i Prev = _mm_set1_epi16(prev);
        __m128i Data;

        int64_t Offset = -(int64_t)keybytes / 8 + 1;

        uint64_t const * keyPtr64 = (uint64_t const *)keyPtr - Offset;
        uint64_t nextkeys;
        memcpy(&nextkeys, keyPtr64 + Offset, sizeof(nextkeys));
        for (; Offset != 0; ++Offset) {
            uint64_t keys = nextkeys;
            memcpy(&nextkeys, keyPtr64 + Offset + 1, sizeof(nextkeys));
            // faster 16-bit delta since we only have 8-bit values
            if (!keys) {  // 32 1-byte ints in a row

                // _mm_cvtepu8_epi16: SSE4.1
                Data = _mm_cvtepu8_epi16(_mm_lddqu_si128((__m128i *)(dataPtr)));
                Prev = _write_16bit_avx_d1(out, Data, Prev);
                Data = _mm_cvtepu8_epi16(_mm_lddqu_si128((__m128i *)(dataPtr + 8)));
                Prev = _write_16bit_avx_d1(out + 8, Data, Prev);
                Data = _mm_cvtepu8_epi16(_mm_lddqu_si128((__m128i *)(dataPtr + 16)));
                Prev = _write_16bit_avx_d1(out + 16, Data, Prev);
                Data = _mm_cvtepu8_epi16(_mm_lddqu_si128((__m128i *)(dataPtr + 24)));
                Prev = _write_16bit_avx_d1(out + 24, Data, Prev);
                out += 32;
                dataPtr += 32;
                continue;
            }

            Data = _decode_avx(keys & 0x00FF, &dataPtr);
            Prev = _write_16bit_avx_d1(out, Data, Prev);
            Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
            Prev = _write_16bit_avx_d1(out + 4, Data, Prev);

            keys >>= 16;
            Data = _decode_avx((keys & 0x00FF), &dataPtr);
            Prev = _write_16bit_avx_d1(out + 8, Data, Prev);
            Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
            Prev = _write_16bit_avx_d1(out + 12, Data, Prev);

            keys >>= 16;
            Data = _decode_avx((keys & 0x00FF), &dataPtr);
            Prev = _write_16bit_avx_d1(out + 16, Data, Prev);
            Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
            Prev = _write_16bit_avx_d1(out + 20, Data, Prev);

            keys >>= 16;
            Data = _decode_avx((keys & 0x00FF), &dataPtr);
            Prev = _write_16bit_avx_d1(out + 24, Data, Prev);
            Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
            Prev = _write_16bit_avx_d1(out + 28, Data, Prev);

            out += 32;
        }
        {
            uint64_t keys = nextkeys;
            // faster 16-bit delta since we only have 8-bit values
            if (!keys) {  // 32 1-byte ints in a row
                Data = _mm_cvtepu8_epi16(_mm_lddqu_si128((__m128i *)(dataPtr)));
                Prev = _write_16bit_avx_d1(out, Data, Prev);
                Data = _mm_cvtepu8_epi16(_mm_lddqu_si128((__m128i *)(dataPtr + 8)));
                Prev = _write_16bit_avx_d1(out + 8, Data, Prev);
                Data = _mm_cvtepu8_epi16(_mm_lddqu_si128((__m128i *)(dataPtr + 16)));
                Prev = _write_16bit_avx_d1(out + 16, Data, Prev);
                Data = _mm_cvtepu8_epi16(_mm_loadl_epi64((__m128i *)(dataPtr + 24)));
                Prev = _write_16bit_avx_d1(out + 24, Data, Prev);
                out += 32;
                dataPtr += 32;

            } else {
                Data = _decode_avx(keys & 0x00FF, &dataPtr);
                Prev = _write_16bit_avx_d1(out, Data, Prev);
                Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
                Prev = _write_16bit_avx_d1(out + 4, Data, Prev);

                keys >>= 16;
                Data = _decode_avx((keys & 0x00FF), &dataPtr);
                Prev = _write_16bit_avx_d1(out + 8, Data, Prev);
                Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
                Prev = _write_16bit_avx_d1(out + 12, Data, Prev);

                keys >>= 16;
                Data = _decode_avx((keys & 0x00FF), &dataPtr);
                Prev = _write_16bit_avx_d1(out + 16, Data, Prev);
                Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
                Prev = _write_16bit_avx_d1(out + 20, Data, Prev);

                keys >>= 16;
                Data = _decode_avx((keys & 0x00FF), &dataPtr);
                Prev = _write_16bit_avx_d1(out + 24, Data, Prev);
                Data = _decode_avx((keys & 0xFF00) >> 8, &dataPtr);
                Prev = _write_16bit_avx_d1(out + 28, Data, Prev);

                out += 32;
            }
        }
        prev = out[-1];
    }
    uint64_t consumedkeys = keybytes - (keybytes & 7);
    return svb_decode_scalar_d1_init(out, keyPtr + consumedkeys, dataPtr, count & 31, prev);
}

STREAMVBYTE_UNTARGET_REGION
#endif


================================================
FILE: c++/pod5_format/svb16/streamvbytedelta_x64_encode_16.c
================================================

#include "streamvbyte_isadetection.h"
#include "streamvbyte_shuffle_tables_encode_16.h"

#include <stdio.h>
#include <string.h>

#ifdef STREAMVBYTE_X64

STREAMVBYTE_TARGET_SSSE3
// Lane-wise difference between each 16-bit element of `curr` and its
// predecessor; the predecessor of lane 0 is the last lane of `prev`.
static __m128i Delta(__m128i curr, __m128i prev)
{
    // _mm_alignr_epi8 (SSSE3): shift the curr:prev pair right by 14 bytes, giving
    // [prev.last, curr[0], ..., curr[6]]
    __m128i const predecessors = _mm_alignr_epi8(curr, prev, 14);
    return _mm_sub_epi16(curr, predecessors);
}

STREAMVBYTE_UNTARGET_REGION

STREAMVBYTE_TARGET_SSSE3
// Zigzag-encode eight 16-bit lanes at once: (N + N) ^ (sign fill of N).
static __m128i zigzag_16(__m128i buf)
{
    __m128i const doubled = _mm_add_epi16(buf, buf);
    // An arithmetic shift count above 15 fills each lane with its sign bit
    // (per the Intel intrinsics reference), i.e. 0xFFFF for negative lanes.
    __m128i const signFill = _mm_srai_epi16(buf, 16);
    return _mm_xor_si128(doubled, signFill);
}

STREAMVBYTE_UNTARGET_REGION

// based on code by aqrit  (streamvbyte_encode_SSSE3)
STREAMVBYTE_TARGET_SSSE3
// SSSE3 encoder for the 16-bit zigzag/delta stream.
//
// Output layout: ceil(count / 8) key bytes (1 bit per value, least-significant
// bit first; 0 = 1 data byte, 1 = 2 data bytes) followed by the data bytes.
//
//   in:    `count` input values.
//   out:   destination buffer. The vector loop stores 16 bytes at a time, so
//          the buffer needs slack beyond the bytes actually used.
//   prev:  value preceding the first element (delta seed).
// Returns the number of bytes used in `out`.
size_t streamvbyte_zigzag_delta_encode_SSSE3_d1_init(
    uint16_t const * in,
    uint32_t count,
    uint8_t * out,
    uint16_t prev)
{
    __m128i Prev = _mm_set1_epi16(prev);
    uint32_t keyLen = (count >> 3) + (((count & 7) + 7) >> 3);  // 1-bit rounded to full byte
    uint8_t * restrict keyPtr = &out[0];
    uint8_t * restrict dataPtr = &out[keyLen];  // variable length data after keys

    __m128i const mask_01 = _mm_set1_epi8(0x01);

    // Vector loop: 16 values (two registers, two key bytes) per iteration.
    for (uint16_t const * end = &in [(count & ~15)]; in != end; in += 16) {
        __m128i rawr0, r0, rawr1, r1, r2, r3;
        size_t keys;

        rawr0 = _mm_loadu_si128((__m128i *)&in[0]);
        r0 = zigzag_16(Delta(rawr0, Prev));
        Prev = rawr0;
        rawr1 = _mm_loadu_si128((__m128i *)&in[8]);
        r1 = zigzag_16(Delta(rawr1, Prev));
        Prev = rawr1;

        // 1 if the byte is set, 0 if not
        r2 = _mm_min_epu8(mask_01, r0);
        r3 = _mm_min_epu8(mask_01, r1);
        // for each (u)int16, FF if the high byte is set, 00 or 01 if not
        // (us = unsigned saturation)
        r2 = _mm_packus_epi16(r2, r3);
        // for each byte, store a bit: 1 if FF, 0 if 00 or 01
        // (so 1 if the value needs two bytes, 0 if it fits in one)
        keys = (size_t)_mm_movemask_epi8(r2);

        r2 = _mm_loadu_si128((__m128i *)&shuf_lut[(keys << 4) & 0x07F0]);
        r3 = _mm_loadu_si128((__m128i *)&shuf_lut[(keys >> 4) & 0x07F0]);
        // _mm_shuffle_epi8: SSSE3
        r0 = _mm_shuffle_epi8(r0, r2);
        r1 = _mm_shuffle_epi8(r1, r3);

        _mm_storeu_si128((__m128i *)dataPtr, r0);
        dataPtr += 8 + popcount(keys & 0xFF);
        _mm_storeu_si128((__m128i *)dataPtr, r1);
        dataPtr += 8 + popcount(keys >> 8);

        // memcpy instead of a punned uint16_t store: keyPtr has no alignment guarantee
        uint16_t const keyPair = (uint16_t)keys;
        memcpy(keyPtr, &keyPair, sizeof(keyPair));  // assumes little endian
        keyPtr += 2;
    }
    prev = (uint16_t)_mm_extract_epi16(Prev, 7);

    // Scalar tail: up to 15 values, i.e. at most two key bytes.
    uint32_t const remaining = count & 15;
    uint16_t key = 0;
    for (uint32_t i = 0; i < remaining; i++) {
        // TODO: can we factor this out to reuse the non-intrinsic code?
        uint16_t dw = (uint16_t)(in[i] - prev);
        prev = in[i];
        uint16_t zz = (uint16_t)((dw + dw) ^ ((int16_t)dw >> 15));
        uint16_t symbol = (zz > 0x00FF);
        // one key bit per value, matching the vector loop and the scalar codec
        key |= (uint16_t)(symbol << i);
        // write only the bytes this value occupies (assumes little endian)
        memcpy(dataPtr, &zz, 1 + symbol);
        dataPtr += 1 + symbol;
    }
    // ceil(remaining / 8) key bytes; writes nothing when remaining is 0
    memcpy(keyPtr, &key, (remaining + 7) >> 3);

    return dataPtr - out;
}

STREAMVBYTE_UNTARGET_REGION
#endif


================================================
FILE: c++/pod5_format/svb16/svb16.c
================================================


================================================
FILE: c++/pod5_format/svb16/svb16.h
================================================
#ifndef SVB16_H
#define SVB16_H

#include <stdint.h>

#if defined(__cplusplus)
extern "C" {
#endif

/// Get the number of key bytes required to encode a given number of 16-bit integers.
///
/// One key bit is used per value, so this is ceil(count / 8).
///
/// Declared `static inline` so that C translation units including this header get
/// a usable definition even when the call is not inlined (a plain `inline`
/// definition in C99 does not provide an external definition).
static inline uint32_t svb16_key_length(uint32_t count)
{
    // ceil(count / 8.0), without overflowing or using fp arithmetic
    return (count >> 3) + (((count & 7) + 7) >> 3);
}

/// Get the maximum number of bytes required to encode a given number of 16-bit integers.
///
/// This is the key bytes plus 2 data bytes per value. The result is computed in
/// 32-bit arithmetic and wraps for very large `count`.
static inline uint32_t svb16_max_encoded_length(uint32_t count)
{
    return svb16_key_length(count) + (2 * count);
}

#if defined(__cplusplus)
};
#endif

#endif  // SVB16_H


================================================
FILE: c++/pod5_format/table_reader.cpp
================================================
#include "pod5_format/table_reader.h"

#include <arrow/ipc/reader.h>
#include <arrow/record_batch.h>
#include <arrow/util/align_util.h>

namespace pod5 {

// Wrap an existing record batch; the shared_ptr is copied, so the batch is
// shared with the caller.
TableRecordBatch::TableRecordBatch(std::shared_ptr<arrow::RecordBatch> const & batch)
: m_batch(batch)
{
}

// Wrap an existing record batch, taking over the caller's shared_ptr.
TableRecordBatch::TableRecordBatch(std::shared_ptr<arrow::RecordBatch> && batch)
: m_batch(std::move(batch))
{
}

// Copy/move operations and the destructor are compiler-generated; they are
// defined here rather than in the header.
TableRecordBatch::TableRecordBatch(TableRecordBatch const &) = default;
TableRecordBatch & TableRecordBatch::operator=(TableRecordBatch const &) = default;
TableRecordBatch::TableRecordBatch(TableRecordBatch &&) = default;
TableRecordBatch & TableRecordBatch::operator=(TableRecordBatch &&) = default;
TableRecordBatch::~TableRecordBatch() = default;

// Number of rows in the wrapped batch, as reported by arrow::RecordBatch::num_rows().
std::size_t TableRecordBatch::num_rows() const { return m_batch->num_rows(); }

//---------------------------------------------------------------------------------------------------------------------

TableReader::TableReader(
    std::shared_ptr<void> && input_source,
    std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
    SchemaMetadataDescription && schema_metadata,
    arrow::MemoryPool * pool)
: m_input_source(std::move(input_source))
, m_reader(std::move(reader))
, m_schema_metadata(std::move(schema_metadata))
{
}

// Move construction, move assignment and destruction use the compiler-generated behaviour;
// they are declared in the header and defaulted here, out of line.
TableReader::TableReader(TableReader &&) = default;
TableReader & TableReader::operator=(TableReader &&) = default;
TableReader::~TableReader() = default;

// Number of record batches reported by the underlying arrow file reader.
std::size_t TableReader::num_record_batches() const
{
    return static_cast<std::size_t>(m_reader->num_record_batches());
}

// Total row count across the file, as computed by the underlying arrow file reader.
Result<int64_t> TableReader::CountRows() const
{
    auto & reader = *m_reader;
    return reader.CountRows();
}

// Read record batch `i` from the file and validate it before handing it back.
Result<std::shared_ptr<arrow::RecordBatch>> TableReader::ReadRecordBatch(int i) const
{
    auto & reader = *m_reader;
    return ReadRecordBatchAndValidate(reader, i);
}

// Read record batch `i` from `reader` and check that its contents are safe to use.
//
// Returns the batch on success. Returns an error Status when:
//  - `i` is not a valid batch index for `reader`,
//  - arrow fails to read the batch,
//  - the batch fails arrow's full validation, or
//  - any column buffer is not aligned to arrow's value alignment.
Result<std::shared_ptr<arrow::RecordBatch>> ReadRecordBatchAndValidate(
    arrow::ipc::RecordBatchFileReader & reader,
    int i)
{
    // Reject out-of-range indices up front instead of relying on the reader to do so.
    // NOTE(review): arrow's file reader appears to range-check the index only with debug
    // assertions - confirm against the arrow version in use.
    int const batch_count = reader.num_record_batches();
    if (i < 0 || i >= batch_count) {
        return Status::Invalid(
            "Record batch index ", i, " is out of range (file has ", batch_count, " batches)");
    }

    ARROW_ASSIGN_OR_RAISE(auto batch, reader.ReadRecordBatch(i));
    ARROW_RETURN_NOT_OK(batch->ValidateFull());

    // Check that the data buffers are aligned.
    std::vector<bool> unaligned_columns;
    unaligned_columns.reserve(batch->num_columns());
    if (!arrow::util::CheckAlignment(*batch, arrow::util::kValueAlignment, &unaligned_columns)) {
        return Status::Invalid("Column data alignment check failed");
    }

    return batch;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/table_reader.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/schema_metadata.h"

#include <memory>

namespace arrow {
class MemoryPool;
class RecordBatch;

namespace ipc {
class RecordBatchFileReader;
}
}  // namespace arrow

namespace pod5 {

/// Thin wrapper holding a shared reference to a single arrow record batch.
class POD5_FORMAT_EXPORT TableRecordBatch {
public:
    /// Wrap \p batch, sharing ownership with the caller.
    TableRecordBatch(std::shared_ptr<arrow::RecordBatch> const & batch);
    /// Wrap \p batch, taking over the caller's reference.
    TableRecordBatch(std::shared_ptr<arrow::RecordBatch> && batch);

    TableRecordBatch(TableRecordBatch &&);
    TableRecordBatch & operator=(TableRecordBatch &&);
    TableRecordBatch(TableRecordBatch const &);
    TableRecordBatch & operator=(TableRecordBatch const &);
    ~TableRecordBatch();

    /// Number of rows in the wrapped batch.
    std::size_t num_rows() const;

    /// Access the wrapped arrow record batch.
    std::shared_ptr<arrow::RecordBatch> const & batch() const { return m_batch; }

private:
    std::shared_ptr<arrow::RecordBatch> m_batch;
};

/// Move-only reader over an arrow IPC file containing one table.
///
/// Owns the arrow file reader, an opaque handle to the input the reader was opened on, and the
/// schema metadata associated with the table.
class POD5_FORMAT_EXPORT TableReader {
public:
    /// \param input_source     Opaque handle stored alongside the reader for its lifetime.
    /// \param reader           The arrow file reader used to read record batches.
    /// \param schema_metadata  Metadata exposed through schema_metadata().
    /// \param pool             Memory pool; the constructor definition does not use it.
    TableReader(
        std::shared_ptr<void> && input_source,
        std::shared_ptr<arrow::ipc::RecordBatchFileReader> && reader,
        SchemaMetadataDescription && schema_metadata,
        arrow::MemoryPool * pool);
    TableReader(TableReader &&);
    TableReader & operator=(TableReader &&);
    TableReader(TableReader const &) = delete;
    TableReader & operator=(TableReader const &) = delete;
    ~TableReader();

    /// The schema metadata passed in at construction.
    SchemaMetadataDescription const & schema_metadata() const { return m_schema_metadata; }

    /// Number of record batches in the file.
    std::size_t num_record_batches() const;

    /// Total number of rows, as reported by the arrow file reader.
    Result<int64_t> CountRows() const;

    /// Read and validate record batch \p i (see ReadRecordBatchAndValidate()).
    Result<std::shared_ptr<arrow::RecordBatch>> ReadRecordBatch(int i) const;

private:
    std::shared_ptr<void> m_input_source;
    std::shared_ptr<arrow::ipc::RecordBatchFileReader> m_reader;
    SchemaMetadataDescription m_schema_metadata;
};

// Same as RecordBatchFileReader::ReadRecordBatch() but validates the contents: the batch must
// pass arrow's full validation and its column buffers must be correctly aligned, otherwise an
// error Status is returned instead of the batch.
Result<std::shared_ptr<arrow::RecordBatch>> ReadRecordBatchAndValidate(
    arrow::ipc::RecordBatchFileReader & reader,
    int i);

}  // namespace pod5


================================================
FILE: c++/pod5_format/thread_pool.cpp
================================================
#include "pod5_format/thread_pool.h"

#include <atomic>
#include <cassert>
#include <condition_variable>
#include <deque>
#include <mutex>
#include <optional>
#include <stdexcept>
#include <thread>
#include <vector>

namespace pod5 {

namespace {

// Fixed-size pool of worker threads consuming a shared FIFO work queue.
//
// Work may optionally be tagged with a strand id. A worker never starts a work item whose strand
// is marked busy, so two items posted to the same strand never run at the same time. All queue
// and strand state is protected by m_work_mutex.
class ThreadPoolImpl : public ThreadPool, public std::enable_shared_from_this<ThreadPoolImpl> {
public:
    // Starts the worker threads. At least one thread is always started, even if `worker_count`
    // is 0 in a build where the assert is compiled out.
    ThreadPoolImpl(std::size_t worker_count)
    {
        assert(worker_count > 0);
        for (std::size_t i = 0; i < std::max<std::size_t>(1, worker_count); ++i) {
            m_threads.emplace_back([&] { run_thread(); });
        }
    }

    // Stops the workers and joins them before the members are destroyed.
    ~ThreadPoolImpl() { stop_and_drain(); }

    // Body of each worker thread: repeatedly claim a runnable work item under the lock, then run
    // its callback outside the lock.
    void run_thread()
    {
        bool keep_alive = true;
        std::optional<WorkItem> work;

        while (keep_alive) {
            {
                std::unique_lock<std::mutex> lock{m_work_mutex};

                // The previous iteration's item (if any) has finished: release its strand so
                // queued work for that strand becomes runnable again.
                if (work) {
                    if (work->strand_id != NO_STRAND) {
                        m_busy_strands[work->strand_id] = false;
                    }
                    work = std::nullopt;
                }

                // find the first piece of work whose strand isn't already busy
                for (auto it = m_work.begin(); it != m_work.end(); ++it) {
                    if (it->strand_id == NO_STRAND || !m_busy_strands.at(it->strand_id)) {
                        if (it->strand_id != NO_STRAND) {
                            m_busy_strands[it->strand_id] = true;
                        }
                        // The item leaves the queue here, before its callback has run.
                        work = std::move(*it);
                        m_work.erase(it);
                        break;
                    }
                }

                if (!work) {
                    if (m_keep_alive) {
                        // Nothing runnable: sleep until notified, then rescan the queue.
                        m_work_ready.wait(lock);
                        keep_alive = m_keep_alive || !m_work.empty();
                    } else {
                        // If there wasn't any work for us to pick up, any remaining work must be
                        // for strands with running tasks (in which case the workers handling
                        // those tasks will pick them up). This will work because once a task
                        // finishes, the worker will check for work *before* checking
                        // m_keep_alive. Thus it's safe for *this* worker to exit.
                        keep_alive = false;
                    }
                    continue;
                }
            }
            assert(work);

            // Run the callback without holding the lock. Items with an empty callback are
            // skipped.
            if (work->callback) {
                work->callback();
            }
        }
    }

    // Queue `callback` with no strand constraint and wake one worker.
    // Throws std::logic_error if the pool has already been stopped.
    void post(std::function<void()> callback) override
    {
        {
            std::lock_guard<std::mutex> l{m_work_mutex};
            if (!m_keep_alive) {
                throw std::logic_error{"ThreadPool: post() called after stop_and_drain()"};
            }
            m_work.emplace_back(WorkItem{std::move(callback), NO_STRAND});
        }

        // Notify after releasing the lock.
        m_work_ready.notify_one();
    }

    // Queue `callback` on strand `strand_id` (used by StrandImpl).
    // Throws std::logic_error if the pool has already been stopped.
    void post(std::function<void()> callback, uint64_t const strand_id)
    {
        assert(strand_id != NO_STRAND);

        std::lock_guard<std::mutex> l{m_work_mutex};
        if (!m_keep_alive) {
            throw std::logic_error{"ThreadPool: post() called after stop_and_drain()"};
        }
        // Grow the busy-flag table on first use of this strand id; new entries start as false.
        if (m_busy_strands.size() <= strand_id) {
            m_busy_strands.resize(strand_id + 1);
        }
        m_work.emplace_back(WorkItem{std::move(callback), strand_id});

        // only send a wakeup if the strand isn't already busy - it's generally more efficient to do
        // this outside the lock, but the conditional makes that hard to reason about
        if (!m_busy_strands.at(strand_id)) {
            m_work_ready.notify_one();
        }
    }

    // Mark the pool as stopped, wake every worker and join them all. Workers keep claiming
    // runnable work until they find none, so the queue is expected to be empty afterwards.
    void stop_and_drain() override
    {
        {
            std::lock_guard<std::mutex> lock{m_work_mutex};
            m_keep_alive = false;
        }
        m_work_ready.notify_all();
        for (auto & thread : m_threads) {
            if (thread.joinable()) {
                thread.join();
            }
        }

        assert(m_work.empty());
    }

    // Poll (every 10ms, re-notifying the workers each time) until the work queue is empty.
    // NOTE(review): this only observes the queue. A work item is removed from the queue before
    // its callback runs, so callbacks may still be executing when this returns.
    void wait_for_drain() override
    {
        auto const drained = [&]() {
            std::lock_guard<std::mutex> lock{m_work_mutex};
            return m_work.empty();
        };
        while (!drained()) {
            m_work_ready.notify_all();
            std::this_thread::sleep_for(std::chrono::milliseconds{10});
        }
    }

    std::shared_ptr<ThreadPoolStrand> create_strand() override;

private:
    // A queued callback together with the strand it belongs to (NO_STRAND if none).
    struct WorkItem {
        std::function<void()> callback;
        uint64_t strand_id;

        // True when the item holds a callable.
        explicit operator bool() const { return !!callback; }
    };

    // Sentinel strand id for work that is not tied to any strand.
    static constexpr uint64_t NO_STRAND = UINT64_MAX;

    // Guards m_keep_alive, m_work and m_busy_strands.
    std::mutex m_work_mutex;
    // Cleared by stop_and_drain(); once false, posting throws and idle workers exit.
    bool m_keep_alive{true};
    // Signalled when work is queued and when the pool is stopped.
    std::condition_variable m_work_ready;
    // Pending work in posting order.
    std::deque<WorkItem> m_work;
    // Indexed by strand id; true while a worker is running an item from that strand.
    std::vector<bool> m_busy_strands;

    // Id handed to the next strand created by create_strand().
    std::atomic<uint64_t> m_next_strand_id{0};
    std::vector<std::thread> m_threads;
};

class StrandImpl : public ThreadPoolStrand {
public:
    StrandImpl(std::shared_ptr<ThreadPoolImpl> pool, uint64_t const strand_id)
    : m_pool(std::move(pool))
    , m_strand_id(strand_id)
    {
    }

    void post(std::function<void()> callback) override
    {
        m_pool->post(std::move(callback), m_strand_id);
    }

    std::shared_ptr<ThreadPoolImpl> m_pool;
    uint64_t m_strand_id;
};

std::shared_ptr<ThreadPoolStrand> ThreadPoolImpl::create_strand()
{
    uint64_t strand_id;
    {
        std::lock_guard<std::mutex> l{m_work_mutex};
        if (!m_keep_alive) {
            throw std::logic_error{"ThreadPool: create_strand() called after stop_and_drain()"};
        }
        strand_id = m_next_strand_id++;
    }
    return std::make_shared<StrandImpl>(shared_from_this(), strand_id);
}
}  // namespace

// Create a thread pool backed by `worker_threads` worker threads.
std::shared_ptr<ThreadPool> make_thread_pool(std::size_t worker_threads)
{
    std::shared_ptr<ThreadPool> pool = std::make_shared<ThreadPoolImpl>(worker_threads);
    return pool;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/thread_pool.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"

#include <functional>
#include <memory>

namespace pod5 {

/// Handle for posting work to a single strand of a ThreadPool (see ThreadPool::create_strand()).
class POD5_FORMAT_EXPORT ThreadPoolStrand {
public:
    virtual ~ThreadPoolStrand() = default;
    /// Queue \p callback to be run on this strand.
    virtual void post(std::function<void()> callback) = 0;
};

/// Abstract interface to a pool of worker threads; create one with make_thread_pool().
class POD5_FORMAT_EXPORT ThreadPool {
public:
    virtual ~ThreadPool() = default;
    /// Create a new strand that posts its work to this pool.
    virtual std::shared_ptr<ThreadPoolStrand> create_strand() = 0;
    /// Queue \p callback to be run by the pool, independent of any strand.
    virtual void post(std::function<void()> callback) = 0;
    /// Stops the thread pool and drains all active work.
    ///
    /// Further calls to create_strand() or post() (including on an existing strand created from
    /// this pool) will throw.
    virtual void stop_and_drain() = 0;

    /// Waits for the threads to process all posted work.
    virtual void wait_for_drain() = 0;
};

POD5_FORMAT_EXPORT std::shared_ptr<ThreadPool> make_thread_pool(std::size_t worker_threads);
}  // namespace pod5


================================================
FILE: c++/pod5_format/tuple_utils.h
================================================
#pragma once

#include <tuple>
#include <utility>

namespace pod5 { namespace detail {

/// Call `f(element, index)` for each index in `Is`, in ascending pack order, where `element` is
/// `std::get<index>(t)`.
///
/// Works for an empty index pack (no calls are made), and is unaffected by the return type of
/// `f`.
template <typename T, typename F, int... Is>
void for_each(T && t, F f, std::integer_sequence<int, Is...>)
{
    // Array-initialiser pack expansion: elements are evaluated left to right. The leading 0
    // keeps the array non-empty for an empty pack, and the (void) cast prevents a user-defined
    // comma operator on f's return type from being picked up.
    int const expand[] = {0, ((void)f(std::get<Is>(t), Is), 0)...};
    (void)expand;
    // Silence unused-parameter diagnostics when the pack is empty.
    (void)t;
    (void)f;
}

/// Call `f(element, index)` for every element of the tuple `t`, in index order.
template <typename... Ts, typename F>
void for_each_in_tuple(std::tuple<Ts...> & t, F f)
{
    using all_indices = std::make_integer_sequence<int, sizeof...(Ts)>;
    detail::for_each(t, f, all_indices());
}

/// Call `f(a, b, index)` for each index in `Is`, in ascending pack order, where `a` and `b` are
/// the elements at that index of `t1` and `t2` respectively.
///
/// Works for an empty index pack (no calls are made), and is unaffected by the return type of
/// `f`.
template <typename T1, typename T2, typename F, int... Is>
void for_each_zipped(T1 && t1, T2 && t2, F f, std::integer_sequence<int, Is...>)
{
    // Array-initialiser pack expansion: elements are evaluated left to right. The leading 0
    // keeps the array non-empty for an empty pack, and the (void) cast prevents a user-defined
    // comma operator on f's return type from being picked up.
    int const expand[] = {0, ((void)f(std::get<Is>(t1), std::get<Is>(t2), Is), 0)...};
    (void)expand;
    // Silence unused-parameter diagnostics when the pack is empty.
    (void)t1;
    (void)t2;
    (void)f;
}

/// Walk two equally sized tuples in lock step, calling `f(a, b, index)` for each position.
/// Tuples of different sizes are rejected at compile time.
template <typename T1, typename T2, typename F>
void for_each_in_tuple_zipped(T1 & t1, T2 & t2, F f)
{
    static_assert(
        std::tuple_size<T1>::value == std::tuple_size<T2>::value, "Tuples must be same size");
    using all_indices = std::make_integer_sequence<int, std::tuple_size<T1>::value>;
    detail::for_each_zipped(t1, t2, f, all_indices());
}

}}  // namespace pod5::detail


================================================
FILE: c++/pod5_format/types.cpp
================================================
#include "pod5_format/types.h"

#include <arrow/array/array_binary.h>
#include <arrow/array/builder_binary.h>
#include <arrow/util/logging.h>

#include <mutex>

namespace pod5 {

// Pointer to the array's values, obtained by reinterpreting the address of element 0 of the
// fixed-size-binary storage as a Uuid.
Uuid const * UuidArray::raw_values() const
{
    auto const & storage = static_cast<arrow::FixedSizeBinaryArray const &>(*storage_);
    auto const * const first_value = storage.GetValue(0);
    return reinterpret_cast<Uuid const *>(first_value);
}

// Copy of the UUID stored at index `i` of the fixed-size-binary storage.
Uuid UuidArray::Value(int64_t i) const
{
    auto const & storage = static_cast<arrow::FixedSizeBinaryArray const &>(*storage_);
    auto const * const value = reinterpret_cast<Uuid const *>(storage.GetValue(i));
    return *value;
}

// Two extension types are considered equal when their extension names match.
bool UuidType::ExtensionEquals(ExtensionType const & other) const
{
    // The type carries no parameters, so the name is the only thing to compare.
    auto const other_name = other.extension_name();
    return other_name == extension_name();
}

// Wrap `data` in a UuidArray. The debug checks confirm that `data` is typed as this extension.
std::shared_ptr<arrow::Array> UuidType::MakeArray(std::shared_ptr<arrow::ArrayData> data) const
{
    DCHECK_EQ(data->type->id(), arrow::Type::EXTENSION);
    DCHECK_EQ(
        static_cast<arrow::ExtensionType const &>(*data->type).extension_name(), extension_name());
    std::shared_ptr<arrow::Array> array = std::make_shared<UuidArray>(data);
    return array;
}

// The type has no parameters, so its serialized form is the empty string.
std::string UuidType::Serialize() const
{
    return std::string{};
}

// Rebuild the extension type from its storage type and serialized metadata.
// Fails with Status::Invalid when the metadata is not empty or the storage type is not
// fixed_size_binary(16).
arrow::Result<std::shared_ptr<arrow::DataType>> UuidType::Deserialize(
    std::shared_ptr<arrow::DataType> storage_type,
    std::string const & serialized_data) const
{
    bool const has_metadata = !serialized_data.empty();
    if (has_metadata) {
        return arrow::Status::Invalid("Unexpected type metadata: '", serialized_data, "'");
    }

    auto const expected_storage = arrow::fixed_size_binary(16);
    if (!storage_type->Equals(*expected_storage)) {
        return arrow::Status::Invalid(
            "Incorrect storage for UuidType: '", storage_type->ToString(), "'");
    }

    return std::make_shared<UuidType>();
}

// View over the bytes stored at index `i` of the large-binary storage. No data is copied.
gsl::span<std::uint8_t const> VbzSignalArray::Value(int64_t i) const
{
    auto const & storage = static_cast<arrow::LargeBinaryArray const &>(*storage_);

    arrow::LargeBinaryArray::offset_type byte_count = 0;
    auto const bytes = storage.GetValue(i, &byte_count);
    return gsl::make_span(bytes, byte_count);
}

// The bytes stored at index `i`, returned as a slice of the storage array's value buffer.
std::shared_ptr<arrow::Buffer> VbzSignalArray::ValueAsBuffer(int64_t i) const
{
    auto const & storage = static_cast<arrow::LargeBinaryArray const &>(*storage_);

    auto const all_values = storage.value_data();
    auto const begin = storage.value_offset(i);
    auto const size = storage.value_length(i);

    return arrow::SliceBuffer(all_values, begin, size);
}

// Two extension types are considered equal when their extension names match.
bool VbzSignalType::ExtensionEquals(ExtensionType const & other) const
{
    // The type carries no parameters, so the name is the only thing to compare.
    auto const other_name = other.extension_name();
    return other_name == extension_name();
}

// Wrap `data` in a VbzSignalArray. The debug checks confirm that `data` is typed as this
// extension.
std::shared_ptr<arrow::Array> VbzSignalType::MakeArray(std::shared_ptr<arrow::ArrayData> data) const
{
    DCHECK_EQ(data->type->id(), arrow::Type::EXTENSION);
    DCHECK_EQ(
        static_cast<arrow::ExtensionType const &>(*data->type).extension_name(), extension_name());
    std::shared_ptr<arrow::Array> array = std::make_shared<VbzSignalArray>(data);
    return array;
}

// The type has no parameters, so its serialized form is the empty string.
std::string VbzSignalType::Serialize() const
{
    return std::string{};
}

// Rebuild the extension type from its storage type and serialized metadata.
// Fails with Status::Invalid when the metadata is not empty or the storage type is not
// large_binary.
arrow::Result<std::shared_ptr<arrow::DataType>> VbzSignalType::Deserialize(
    std::shared_ptr<arrow::DataType> storage_type,
    std::string const & serialized_data) const
{
    bool const has_metadata = !serialized_data.empty();
    if (has_metadata) {
        return arrow::Status::Invalid("Unexpected type metadata: '", serialized_data, "'");
    }

    auto const expected_storage = arrow::large_binary();
    if (!storage_type->Equals(*expected_storage)) {
        return arrow::Status::Invalid(
            "Incorrect storage for VbzSignalType: '", storage_type->ToString(), "'");
    }

    return std::make_shared<VbzSignalType>();
}

// Create a builder for read id columns: a fixed-size-binary builder using the storage type of
// the UUID extension type and allocating from `pool`.
std::unique_ptr<arrow::FixedSizeBinaryBuilder> make_read_id_builder(arrow::MemoryPool * pool)
{
    auto const & id_type = uuid();
    assert(id_type->id() == arrow::Type::EXTENSION);

    auto builder = std::make_unique<arrow::FixedSizeBinaryBuilder>(id_type->storage_type(), pool);
    // A UUID is 16 bytes wide.
    assert(builder->byte_width() == 16);
    return builder;
}

std::shared_ptr<VbzSignalType> const & vbz_signal()
{
    static auto vbz_signal = std::make_shared<VbzSignalType>();
    return vbz_signal;
}

std::shared_ptr<UuidType> const & uuid()
{
    static auto uuid = std::make_shared<UuidType>();
    return uuid;
}

namespace {

// Mutex guarding the extension-type registration counter.
std::mutex & get_pod5_register_mutex()
{
    // The mutex is allocated on the heap and never deleted, so it remains usable if user code
    // calls in during static initialisation or destruction (not that they should).
    static std::mutex * const registration_mutex = new std::mutex{};
    return *registration_mutex;
}

std::size_t s_pod5_register_count(0);

}  // namespace

// Register the pod5 extension types with arrow.
//
// Calls are counted: only the call that takes the count from 0 to 1 performs the registration.
// The count is incremented before registering, so it is incremented even when registration
// fails and an error Status is returned.
pod5::Status register_extension_types()
{
    std::lock_guard guard(get_pod5_register_mutex());

    s_pod5_register_count += 1;
    bool const is_first_registration = (s_pod5_register_count == 1);
    if (!is_first_registration) {
        return pod5::Status::OK();
    }

    ARROW_RETURN_NOT_OK(arrow::RegisterExtensionType(uuid()));
    ARROW_RETURN_NOT_OK(arrow::RegisterExtensionType(vbz_signal()));
    return pod5::Status::OK();
}

// Undo one call to register_extension_types().
//
// Calls are counted: only the call that takes the count back to 0 unregisters the types from
// arrow, and each type is only unregistered if arrow currently knows about it. A call made when
// the count is already 0 (more unregister than register calls) is a no-op that returns OK.
pod5::Status unregister_extension_types()
{
    std::lock_guard lock(get_pod5_register_mutex());

    // The counter is unsigned: decrementing it at 0 would wrap to the maximum value, making
    // check_extension_types_registered() report true and preventing any later registration.
    if (s_pod5_register_count == 0) {
        return pod5::Status::OK();
    }

    auto register_count = --s_pod5_register_count;
    if (register_count == 0) {
        if (arrow::GetExtensionType("minknow.uuid")) {
            ARROW_RETURN_NOT_OK(arrow::UnregisterExtensionType("minknow.uuid"));
        }
        if (arrow::GetExtensionType("minknow.vbz")) {
            ARROW_RETURN_NOT_OK(arrow::UnregisterExtensionType("minknow.vbz"));
        }
    }
    return pod5::Status::OK();
}

// True while the registration count is non-zero.
bool check_extension_types_registered()
{
    std::lock_guard guard(get_pod5_register_mutex());
    bool const any_registered = (s_pod5_register_count != 0);
    return any_registered;
}

}  // namespace pod5


================================================
FILE: c++/pod5_format/types.h
================================================
#pragma once

#include "pod5_format/pod5_format_export.h"
#include "pod5_format/result.h"
#include "pod5_format/uuid.h"

#include <arrow/extension_type.h>
#include <arrow/stl_iterator.h>
#include <gsl/gsl-lite.hpp>

namespace pod5 {

/// Arrow extension array of UUIDs, with typed accessors and STL-style iteration.
class POD5_FORMAT_EXPORT UuidArray : public arrow::ExtensionArray {
public:
    using IteratorType = arrow::stl::ArrayIterator<UuidArray>;

    using ExtensionArray::ExtensionArray;

    /// Pointer to the values of the underlying storage array, viewed as Uuid objects.
    Uuid const * raw_values() const;

    /// Copy of the UUID at index \p i.
    Uuid Value(int64_t i) const;

    // this isn't actually a view - it copies the data - but
    // (a) it's only 16 bytes, which is what a view (pointer + size) would require anyway
    // (b) arrow::stl::ArrayIterator hard-codes the name of this method (even though it is supposed
    //     to be configurable via the ValueAccessor template parameter)
    Uuid GetView(int64_t i) const { return Value(i); }

    /// Element access implemented by dereferencing an iterator positioned at index \p i.
    std::optional<Uuid> operator[](int64_t i) const { return *IteratorType(*this, i); }

    IteratorType begin() const { return IteratorType(*this); }

    IteratorType end() const { return IteratorType(*this, length()); }
};

/// Arrow extension type named "minknow.uuid", stored as 16-byte fixed-size binary values.
class POD5_FORMAT_EXPORT UuidType : public arrow::ExtensionType {
public:
    UuidType() : ExtensionType(arrow::fixed_size_binary(16)) {}

    std::string extension_name() const override { return "minknow.uuid"; }

    /// Compares extension names only; the type has no parameters.
    bool ExtensionEquals(ExtensionType const & other) const override;
    /// Wraps \p data in a UuidArray.
    std::shared_ptr<arrow::Array> MakeArray(std::shared_ptr<arrow::ArrayData> data) const override;
    /// Always the empty string.
    std::string Serialize() const override;
    /// Requires empty \p serialized_data and fixed_size_binary(16) storage.
    arrow::Result<std::shared_ptr<arrow::DataType>> Deserialize(
        std::shared_ptr<arrow::DataType> storage_type,
        std::string const & serialized_data) const override;
};

/// Arrow extension array whose elements are byte blobs held in large-binary storage.
class POD5_FORMAT_EXPORT VbzSignalArray : public arrow::ExtensionArray {
public:
    using IteratorType = arrow::stl::ArrayIterator<VbzSignalArray>;

    /// Non-owning view of the bytes at index \p i.
    gsl::span<std::uint8_t const> Value(int64_t i) const;
    /// The bytes at index \p i as a slice of the array's value buffer.
    std::shared_ptr<arrow::Buffer> ValueAsBuffer(int64_t i) const;

    using ExtensionArray::ExtensionArray;
};

/// Arrow extension type named "minknow.vbz", stored as large binary values.
class POD5_FORMAT_EXPORT VbzSignalType : public arrow::ExtensionType {
public:
    VbzSignalType() : ExtensionType(arrow::large_binary()) {}

    std::string extension_name() const override { return "minknow.vbz"; }

    /// Compares extension names only; the type has no parameters.
    bool ExtensionEquals(ExtensionType const & other) const override;
    /// Wraps \p data in a VbzSignalArray.
    std::shared_ptr<arrow::Array> MakeArray(std::shared_ptr<arrow::ArrayData> data) const override;
    /// Always the empty string.
    std::string Serialize() const override;
    /// Requires empty \p serialized_data and large_binary storage.
    arrow::Result<std::shared_ptr<arrow::DataType>> Deserialize(
        std::shared_ptr<arrow::DataType> storage_type,
        std::string const & serialized_data) const override;
};

/// \brief Create a fixed-size-binary builder for the storage type of the UUID extension type.
std::unique_ptr<arrow::FixedSizeBinaryBuilder> make_read_id_builder(arrow::MemoryPool * pool);

/// \brief Shared instance of the "minknow.vbz" extension type.
std::shared_ptr<VbzSignalType> const & vbz_signal();
/// \brief Shared instance of the "minknow.uuid" extension type.
std::shared_ptr<UuidType> const & uuid();

/// \brief Register all required extension types.
POD5_FORMAT_EXPORT pod5::Status register_extension_types();

/// \brief Unregister all required extension types.
POD5_FORMAT_EXPORT pod5::Status unregister_extension_types();

/// \brief Returns true iff the required extension types are registered.
/// \details The caller can expect the extension types to be registered if the number of calls to
/// `register_extension_types` exceeds the number of calls to `unregister_extension_types`.
bool check_extension_types_registered();

}  // namespace pod5


================================================
FILE: c++/pod5_format/uuid.h
================================================
#pragma once

// This file contains code from https://github.com/mariusbancila/stduuid/ which has the following
// license:
//
//   MIT License
//
//   Copyright (c) 2017
//
//   Permission is hereby granted, free of charge, to any person obtaining a copy
//   of this software and associated documentation files (the "Software"), to deal
//   in the Software without restriction, including without limitation the rights
//   to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
//   copies of the Software, and to permit persons to whom the Software is
//   furnished to do so, subject to the following conditions:
//
//   The above copyright notice and this permission notice shall be included in all
//   copies or substantial portions of the Software.
//
//   THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
//   IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
//   FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
//   AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
//   LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
//   OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
//   SOFTWARE.

#include <algorithm>
#include <array>
#include <cstddef>
#include <cstdint>
#include <iosfwd>
#include <iterator>
#include <optional>
#include <random>
#include <string>
#include <string_view>

namespace pod5 {

namespace uuid_detail {

/// Convert one hexadecimal digit character ('0'-'9', 'a'-'f', 'A'-'F') to its value, 0-15.
/// Any other character yields 0.
template <typename TChar>
[[nodiscard]] constexpr inline unsigned char hex2char(TChar const ch) noexcept
{
    TChar const digit_first = static_cast<TChar>('0');
    TChar const digit_last = static_cast<TChar>('9');
    TChar const lower_first = static_cast<TChar>('a');
    TChar const lower_last = static_cast<TChar>('f');
    TChar const upper_first = static_cast<TChar>('A');
    TChar const upper_last = static_cast<TChar>('F');

    if (digit_first <= ch && ch <= digit_last) {
        return static_cast<unsigned char>(ch - digit_first);
    }
    if (lower_first <= ch && ch <= lower_last) {
        return static_cast<unsigned char>(10 + ch - lower_first);
    }
    if (upper_first <= ch && ch <= upper_last) {
        return static_cast<unsigned char>(10 + ch - upper_first);
    }
    return 0;
}

/// True when `ch` is a hexadecimal digit: '0'-'9', 'a'-'f' or 'A'-'F'.
template <typename TChar>
[[nodiscard]] constexpr inline bool is_hex(TChar const ch) noexcept
{
    if (ch >= static_cast<TChar>('0') && ch <= static_cast<TChar>('9')) {
        return true;
    }
    if (ch >= static_cast<TChar>('a') && ch <= static_cast<TChar>('f')) {
        return true;
    }
    return ch >= static_cast<TChar>('A') && ch <= static_cast<TChar>('F');
}

/// View over a null-terminated character string; a null pointer yields an empty view.
template <typename TChar>
[[nodiscard]] constexpr std::basic_string_view<TChar> to_string_view(TChar const * str) noexcept
{
    if (str == nullptr) {
        return std::basic_string_view<TChar>();
    }
    return std::basic_string_view<TChar>(str);
}

/// View over a string-like object, using that type's own conversion to a string view. The view
/// refers to `str`'s characters and must not outlive them.
template <typename StringType>
[[nodiscard]] constexpr std::
    basic_string_view<typename StringType::value_type, typename StringType::traits_type>
    to_string_view(StringType const & str) noexcept
{
    using view_type =
        std::basic_string_view<typename StringType::value_type, typename StringType::traits_type>;
    view_type const view = str;
    return view;
}

// Textual form of the all-zero UUID (36 characters plus terminator). Used as the initial
// contents of formatted UUID strings and as the source of the '-' separators.
template <typename CharT>
inline constexpr CharT empty_guid[37] = "00000000-0000-0000-0000-000000000000";

// Wide-character version of the above.
template <>
inline constexpr wchar_t empty_guid<wchar_t>[37] = L"00000000-0000-0000-0000-000000000000";

// Lookup table mapping a 4-bit value (0-15) to its lowercase hexadecimal digit.
template <typename CharT>
inline constexpr CharT guid_encoder[17] = "0123456789abcdef";

// Wide-character version of the above.
template <>
inline constexpr wchar_t guid_encoder<wchar_t>[17] = L"0123456789abcdef";

}  // namespace uuid_detail

// Forward declare uuid & to_string so that we can declare to_string as a friend later.
class Uuid;
template <
    class CharT = char,
    class Traits = std::char_traits<CharT>,
    class Allocator = std::allocator<CharT>>
std::basic_string<CharT, Traits, Allocator> to_string(Uuid const & id);

/// A representation of a Universally Unique IDentifier.
///
/// This code implements part of RFC 4122. It does not aim to be a complete implementation of UUIDs,
/// but provides enough for the uses in the POD5 library.
///
/// The value is held as 16 raw bytes; a default-constructed Uuid is all zeros (nil).
class Uuid {
public:
    using value_type = uint8_t;

    /// Construct the nil (all-zero) UUID.
    constexpr Uuid() noexcept = default;

    /// Construct from a C array of exactly 16 bytes.
    Uuid(value_type const (&arr)[16]) noexcept
    {
        std::copy(std::cbegin(arr), std::cend(arr), std::begin(m_data));
    }

    /// Construct from a std::array of 16 bytes.
    constexpr Uuid(std::array<value_type, 16> const & arr) noexcept : m_data{arr} {}

    /// Construct from an iterator range. The bytes are copied only when the range holds exactly
    /// 16 elements; for any other length the UUID is left as nil.
    template <typename ForwardIterator>
    explicit Uuid(ForwardIterator first, ForwardIterator last)
    {
        if (std::distance(first, last) == 16) {
            std::copy(first, last, std::begin(m_data));
        }
    }

    /// True when every byte is zero.
    [[nodiscard]] constexpr bool is_nil() const noexcept
    {
        for (size_t i = 0; i < m_data.size(); ++i) {
            if (m_data[i] != 0) {
                return false;
            }
        }
        return true;
    }

    void swap(Uuid & other) noexcept { m_data.swap(other.m_data); }

    /// Pointer to the 16 raw bytes.
    uint8_t const * data() const noexcept { return m_data.data(); }

    /// Number of raw bytes (always 16).
    size_t size() const noexcept { return m_data.size(); }

    /// Copy the 16 raw bytes into \p arr.
    void to_c_array(value_type (&arr)[16]) const noexcept
    {
        std::copy(std::cbegin(m_data), std::cend(m_data), std::begin(arr));
    }

    /// Write the 36-character textual form (lowercase hex, 8-4-4-4-12 grouping) to \p uustr.
    /// No terminator is written.
    // Note: uustr must be at least 36 characters
    template <typename CharT>
    void write_to(CharT * uustr) const noexcept
    {
        for (size_t i = 0, index = 0; i < 36; ++i) {
            // Positions of the '-' separators.
            if (i == 8 || i == 13 || i == 18 || i == 23) {
                uustr[i] = uuid_detail::empty_guid<CharT>[i];
                continue;
            }
            // Each byte produces two characters: high nibble first, then low nibble. The
            // pre-increment consumes the second character position.
            uustr[i] = uuid_detail::guid_encoder<CharT>[m_data[index] >> 4 & 0x0f];
            uustr[++i] = uuid_detail::guid_encoder<CharT>[m_data[index] & 0x0f];
            index++;
        }
    }

    /// Parse a UUID from text.
    ///
    /// The text may optionally be wrapped in '{' and '}'. Every '-' is skipped wherever it
    /// appears; the remaining characters must be exactly 32 hexadecimal digits (either case).
    ///
    /// \returns The parsed UUID, or an empty optional if the text is empty, has an opening
    ///          brace without a closing one, contains a non-hex character, or does not contain
    ///          exactly 32 hex digits.
    template <typename StringType>
    [[nodiscard]] constexpr static std::optional<Uuid> from_string(
        StringType const & in_str) noexcept
    {
        auto str = uuid_detail::to_string_view(in_str);
        // True when the next hex digit is the high nibble of a byte.
        bool firstDigit = true;
        // 1 when the text is wrapped in braces, so both ends are skipped by one character.
        size_t hasBraces = 0;
        // Index of the byte currently being filled.
        size_t index = 0;

        std::array<uint8_t, 16> data{{0}};

        if (str.empty()) {
            return {};
        }

        if (str.front() == '{') {
            hasBraces = 1;
        }
        if (hasBraces && str.back() != '}') {
            return {};
        }

        for (size_t i = hasBraces; i < str.size() - hasBraces; ++i) {
            if (str[i] == '-') {
                continue;
            }

            // Reject a 33rd hex digit as well as any non-hex character.
            if (index >= 16 || !uuid_detail::is_hex(str[i])) {
                return {};
            }

            if (firstDigit) {
                data[index] = static_cast<uint8_t>(uuid_detail::hex2char(str[i]) << 4);
                firstDigit = false;
            } else {
                data[index] = static_cast<uint8_t>(data[index] | uuid_detail::hex2char(str[i]));
                index++;
                firstDigit = true;
            }
        }

        // Fewer than 16 complete bytes were read.
        if (index < 16) {
            return {};
        }

        return Uuid{data};
    }

private:
    std::array<value_type, 16> m_data{{0}};

    friend bool operator==(Uuid const & lhs, Uuid const & rhs) noexcept;
    friend bool operator<(Uuid const & lhs, Uuid const & rhs) noexcept;

    template <class Elem, class Traits>
    friend std::basic_ostream<Elem, Traits> & operator<<(
        std::basic_ostream<Elem, Traits> & s,
        Uuid const & id);

    template <class CharT, class Traits, class Allocator>
    friend std::basic_string<CharT, Traits, Allocator> to_string(Uuid const & id);

    friend std::hash<Uuid>;
};

/// Two UUIDs are equal when all 16 bytes match.
[[nodiscard]] inline bool operator==(Uuid const & lhs, Uuid const & rhs) noexcept
{
    bool const same_bytes = (lhs.m_data == rhs.m_data);
    return same_bytes;
}

/// Negation of operator==.
[[nodiscard]] inline bool operator!=(Uuid const & lhs, Uuid const & rhs) noexcept
{
    bool const equal = (lhs == rhs);
    return !equal;
}

/// Orders UUIDs by comparing their raw byte arrays.
[[nodiscard]] inline bool operator<(Uuid const & lhs, Uuid const & rhs) noexcept
{
    bool const lhs_first = (lhs.m_data < rhs.m_data);
    return lhs_first;
}

/// Format `id` as a 36-character string (lowercase hex, 8-4-4-4-12 grouping).
template <class CharT, class Traits, class Allocator>
[[nodiscard]] inline std::basic_string<CharT, Traits, Allocator> to_string(Uuid const & id)
{
    // Start from the all-zero text so the string already has the right length, then overwrite
    // its characters in place.
    std::basic_string<CharT, Traits, Allocator> text{uuid_detail::empty_guid<CharT>};
    CharT * const out = text.data();
    id.write_to(out);
    return text;
}

template <class Elem, class Traits>
std::basic_ostream<Elem, Traits> & operator<<(std::basic_ostream<Elem, Traits> & s, Uuid const & id)
{
    s << to_string(id);
    return s;
}

/// Non-member swap, forwarding to Uuid::swap.
inline void swap(Uuid & lhs, Uuid & rhs) noexcept
{
    lhs.swap(rhs);
}

/// Generates random (version 4) UUIDs from a caller-supplied random number engine.
///
/// The engine is held by pointer and is not owned; it must outlive the generator.
template <typename UniformRandomNumberGenerator>
class BasicUuidRandomGenerator {
public:
    using engine_type = UniformRandomNumberGenerator;

    explicit BasicUuidRandomGenerator(engine_type & gen) : generator(&gen) {}

    explicit BasicUuidRandomGenerator(engine_type * gen) : generator(gen) {}

    /// Produce the next random UUID.
    [[nodiscard]] Uuid operator()()
    {
        // Fill the 16 bytes with four 32-bit random words.
        alignas(uint32_t) uint8_t raw[16];
        auto * const words = reinterpret_cast<uint32_t *>(raw);
        for (int word = 0; word < 4; ++word) {
            words[word] = distribution(*generator);
        }

        // variant must be 10xxxxxx
        raw[8] = static_cast<uint8_t>((raw[8] & 0xBF) | 0x80);

        // version must be 0100xxxx
        raw[6] = static_cast<uint8_t>((raw[6] & 0x4F) | 0x40);

        return Uuid{std::begin(raw), std::end(raw)};
    }

private:
    std::uniform_int_distribution<uint32_t> distribution;
    UniformRandomNumberGenerator * generator;
};

using UuidRandomGenerator = BasicUuidRandomGenerator<std::mt19937>;

}  // namespace pod5

namespace std {
/// Hash support so that pod5::Uuid can be used as a key in unordered containers.
template <>
struct hash<pod5::Uuid> {
    using argument_type = pod5::Uuid;
    using result_type = std::size_t;

    [[nodiscard]] result_type operator()(argument_type const & uuid) const
    {
        // Pack eight consecutive bytes, starting at `first`, into a 64-bit value with the
        // first byte in the most significant position.
        auto const pack_bytes = [&uuid](std::size_t first) {
            uint64_t packed = 0;
            for (std::size_t offset = 0; offset < 8; ++offset) {
                packed = (packed << 8) | static_cast<uint64_t>(uuid.m_data[first + offset]);
            }
            return packed;
        };

        // XOR the two 64-bit halves of the UUID together.
        uint64_t const combined = pack_bytes(0) ^ pack_bytes(8);

        if constexpr (sizeof(result_type) > 4) {
            return result_type(combined);
        } else {
            // 32-bit size_t: fold the upper half into the lower half.
            return result_type(uint32_t(combined >> 32) ^ uint32_t(combined));
        }
    }
};
}  // namespace std


================================================
FILE: c++/pod5_format/version.h.in
================================================
#pragma once

// <cstdint> is required for std::uint16_t; <string> alone does not guarantee it.
#include <cstdint>
#include <string>

namespace pod5 {

// Library version components. The @...@ placeholders are filled in when the build system
// configures this template into the real header.
std::uint16_t const Pod5MajorVersion = @POD5_VERSION_MAJOR@;
std::uint16_t const Pod5MinorVersion = @POD5_VERSION_MINOR@;
std::uint16_t const Pod5RevVersion = @POD5_VERSION_REV@;

// The same version rendered as a string.
std::string const Pod5Version = "@POD5_NUMERIC_VERSION@";

}  // namespace pod5


================================================
FILE: c++/pod5_format_pybind/CMakeLists.txt
================================================

# Python extension module wrapping the pod5_format library via pybind11.
pybind11_add_module(pod5_format_pybind
    api.h
    bindings.cpp
    utils.h
    subset.cpp
    subset.h

    repack/repack_functions.h
    repack/repack_states.h
    repack/repack_utils.h
    repack/repack_output.cpp
    repack/repack_output.h
    repack/repacker.cpp
    repack/repacker.h
)

# The core library is linked PRIVATE: it is not propagated to anything linking this module.
target_link_libraries(pod5_format_pybind
    PRIVATE
        pod5_format
)

# The shared warning flags are only applied to non-MSVC compilers.
if (NOT MSVC)
    target_compile_options(pod5_format_pybind PRIVATE ${pod5_warning_options})
endif()

# Build as position independent code and compile the bindings as C++20.
set_target_properties(pod5_format_pybind
    PROPERTIES
        POSITION_INDEPENDENT_CODE 1
        CXX_STANDARD 20
)

# Non-conan license files to copy (passed to build_wheel.cmake as POD5_CXX_LICENSES_SRC).
set(pod5_cxx_licenses_src
    "${CMAKE_SOURCE_DIR}/LICENSE.md"
    "${CMAKE_SOURCE_DIR}/third_party/licenses/gsl-lite.txt"
    "${CMAKE_SOURCE_DIR}/third_party/pybind11/LICENSE"
)
# Destination name for the above files (passed as POD5_CXX_LICENSES_DST).
# Entries pair up by position with pod5_cxx_licenses_src, so keep both lists in the same order.
set(pod5_cxx_licenses_dst
    "LICENSE.md"
    "gsl-lite.txt"
    "pybind11.txt"
)

# Root of the lib_pod5 Python project inside the source tree.
set(python_project_root "${CMAKE_SOURCE_DIR}/python/lib_pod5/")

# Generate _version.py from its template at configure time.
# Note that the output is written into the source tree, not the build directory.
configure_file(
    ${CMAKE_CURRENT_SOURCE_DIR}/_version.py.in
    ${python_project_root}/src/lib_pod5/_version.py
)

# Stamp file used as the declared OUTPUT of the wheel build command below.
set(wheel_output_stub "${CMAKE_CURRENT_BINARY_DIR}/wheel.touch")

# Versioned directory that receives the built wheel; created at configure time.
set(wheel_output_dir "${CMAKE_CURRENT_BINARY_DIR}/wheel_${POD5_FULL_VERSION}")
file(MAKE_DIRECTORY ${wheel_output_dir})

# Run build_wheel.cmake in script mode (-P) once the extension module has been built.
# All inputs are handed over as -D definitions.
# NOTE(review): the stamp path itself is not passed to the script - confirm that
# build_wheel.cmake creates "${wheel_output_stub}", otherwise this command re-runs every build.
add_custom_command(
    OUTPUT "${wheel_output_stub}"
    COMMAND ${CMAKE_COMMAND}
    ARGS
        -D "PYTHON_EXECUTABLE=${Python_EXECUTABLE}"
        -D "PYTHON_PROJECT_DIR=${python_project_root}"
        -D "PYBIND_INPUT_LIB=$<TARGET_FILE:pod5_format_pybind>"
        -D "WHEEL_OUTPUT_DIR=${wheel_output_dir}"
        -D "POD5_CONAN_LICENSES=${CMAKE_BINARY_DIR}/pod5_conan_licenses"
        -D "POD5_CXX_LICENSES_SRC=${pod5_cxx_licenses_src}"
        -D "POD5_CXX_LICENSES_DST=${pod5_cxx_licenses_dst}"
        -P "${CMAKE_CURRENT_SOURCE_DIR}/build_wheel.cmake"
    DEPENDS
        pod5_format_pybind
    VERBATIM
)

# Target in the default build (ALL) that drives the custom command above via the stamp file.
add_custom_target(lib_pod5_python_wheel ALL
    SOURCES
        build_wheel.cmake
    DEPENDS
        "${wheel_output_stub}"
)

# Install only the built lib_pod5 wheel(s) from the wheel output directory, as part of the
# "wheel" install component, into the root of the install prefix.
install(
    DIRECTORY "${wheel_output_dir}/"
    DESTINATION "."
    COMPONENT wheel
    FILES_MATCHING PATTERN "lib_pod5*.whl"
)


================================================
FILE: c++/pod5_format_pybind/_version.py.in
================================================
# This file is auto-generated by CMake (configure_file) at configure time.
__version__ = version = "@POD5_FULL_VERSION@"
__version_tuple__ = version_tuple = (@POD5_VERSION_MAJOR@, @POD5_VERSION_MINOR@, @POD5_VERSION_REV@)


================================================
FILE: c++/pod5_format_pybind/api.h
================================================
#pragma once

#include "pod5_format/async_signal_loader.h"
#include "pod5_format/c_api.h"
#include "pod5_format/file_reader.h"
#include "pod5_format/file_updater.h"
#include "pod5_format/file_writer.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/signal_compression.h"
#include "pod5_format/signal_table_reader.h"
#include "pod5_format/thread_pool.h"
#include "pod5_format/uuid.h"
#include "utils.h"

#include <arrow/memory_pool.h>
#include <pybind11/numpy.h>
#include <pybind11/pybind11.h>
#include <pybind11/stl.h>

namespace py = pybind11;

// Create a new POD5 file at `path` and return the writer for it.
//
// `writer_name` is forwarded unchanged to pod5::create_file_writer. `options` may be null, in
// which case default-constructed FileWriterOptions are used. A failure from the underlying call
// is reported through POD5_PYTHON_ASSIGN_OR_RAISE.
inline std::shared_ptr<pod5::FileWriter> create_file(
    char const * path,
    std::string const & writer_name,
    pod5::FileWriterOptions const * options)
{
    POD5_PYTHON_ASSIGN_OR_RAISE(
        auto writer,
        pod5::create_file_writer(
            path, writer_name, options ? *options : pod5::FileWriterOptions{}));
    return writer;
}

// Run pod5::recover_file from `src_filename` to `dest_filename` and return its details.
//
// A null `options` pointer selects default-constructed RecoverFileOptions. A failure from the
// underlying call is reported through POD5_PYTHON_ASSIGN_OR_RAISE.
inline pod5::RecoveryDetails recover_file(
    char const * src_filename,
    char const * dest_filename,
    pod5::RecoverFileOptions const * const options)
{
    // Resolve the optional pointer to a concrete options value up front.
    pod5::RecoverFileOptions const effective_options =
        options ? *options : pod5::RecoverFileOptions{};

    POD5_PYTHON_ASSIGN_OR_RAISE(
        pod5::RecoveryDetails recovery,
        pod5::recover_file(src_filename, dest_filename, effective_options));
    return recovery;
}

// A single batch of cached signal data, exposed to Python as numpy arrays.
class Pod5SignalCacheBatch {
public:
    // Takes ownership of `cached_data`; `samples_mode` records whether samples were loaded.
    Pod5SignalCacheBatch(
        pod5::AsyncSignalLoader::SamplesMode samples_mode,
        pod5::CachedBatchSignalData && cached_data)
    : m_samples_mode(samples_mode)
    , m_cached_data(std::move(cached_data))
    {
    }

    // Per-row sample counts for the batch as a numpy array.
    py::array_t<std::uint64_t> sample_count() const
    {
        auto const & counts = m_cached_data.sample_count();
        return py::array_t<std::uint64_t>(counts.size(), counts.data());
    }

    // One int16 numpy array per row. The list is empty unless the batch was loaded in
    // SamplesMode::Samples.
    py::list samples() const
    {
        py::list per_row_arrays;
        if (m_samples_mode == pod5::AsyncSignalLoader::SamplesMode::Samples) {
            for (auto const & row : m_cached_data.samples()) {
                per_row_arrays.append(
                    py::array_t<std::int16_t>({row.size()}, {sizeof(std::int16_t)}, row.data()));
            }
        }
        return per_row_arrays;
    }

    // Index of the batch this data belongs to.
    std::uint32_t batch_index() const { return m_cached_data.batch_index(); }

private:
    pod5::AsyncSignalLoader::SamplesMode m_samples_mode;
    pod5::CachedBatchSignalData m_cached_data;
};

// Python-facing wrapper around pod5::AsyncSignalLoader.
//
// Besides the loader itself, the wrapper owns the storage behind the spans that are handed to the
// loader: either m_batch_sizes or the numpy arrays m_batch_counts_ref / m_batch_rows_ref. Those
// members are declared before m_async_loader so they are initialised before the loader is built.
class Pod5AsyncSignalLoader {
public:
    // Make an async loader for all reads in the file
    Pod5AsyncSignalLoader(
        std::shared_ptr<pod5::FileReader> const & reader,
        pod5::AsyncSignalLoader::SamplesMode samples_mode,
        std::size_t worker_count = std::thread::hardware_concurrency(),
        std::size_t max_pending_batches = 10)
    : m_samples_mode(samples_mode)
    , m_batch_counts_ref({})
    , m_batch_rows_ref({})
    , m_async_loader(reader, samples_mode, {}, {}, worker_count, max_pending_batches)
    {
    }

    // Make an async loader for specific batches
    Pod5AsyncSignalLoader(
        std::shared_ptr<pod5::FileReader> const & reader,
        pod5::AsyncSignalLoader::SamplesMode samples_mode,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batches,
        std::size_t worker_count = std::thread::hardware_concurrency(),
        std::size_t max_pending_batches = 10)
    : m_samples_mode(samples_mode)
    , m_batch_sizes(make_batch_counts(reader, batches))
    , m_async_loader(
          reader,
          samples_mode,
          gsl::make_span(m_batch_sizes),
          {},
          worker_count,
          max_pending_batches)
    {
    }

    // Make an async loader for specific reads in specific batches
    Pod5AsyncSignalLoader(
        std::shared_ptr<pod5::FileReader> const & reader,
        pod5::AsyncSignalLoader::SamplesMode samples_mode,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batch_counts,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batch_rows,
        std::size_t worker_count = std::thread::hardware_concurrency(),
        std::size_t max_pending_batches = 10)
    : m_samples_mode(samples_mode)
    , m_batch_counts_ref(std::move(batch_counts))
    , m_batch_rows_ref(std::move(batch_rows))
    , m_async_loader(
          reader,
          samples_mode,
          gsl::make_span(m_batch_counts_ref.data(), m_batch_counts_ref.size()),
          gsl::make_span(m_batch_rows_ref.data(), m_batch_rows_ref.size()),
          worker_count,
          max_pending_batches)
    {
    }

    // Hand the next loaded batch to the caller.
    //
    // Throws std::runtime_error if the loader reports a failure, and pybind11::stop_iteration
    // once the loader has no further batch to return.
    std::shared_ptr<Pod5SignalCacheBatch> release_next_batch()
    {
        auto batch = m_async_loader.release_next_batch();
        if (!batch.ok()) {
            throw std::runtime_error(batch.status().ToString());
        }

        if (!*batch) {
            assert(m_async_loader.is_finished());
            throw pybind11::stop_iteration();
        }

        return std::make_shared<Pod5SignalCacheBatch>(m_samples_mode, std::move(**batch));
    }

    // Build a per-batch row count table covering every read batch in the file.
    //
    // Batches listed in `batches` receive their row count; every other entry stays 0.
    // Throws std::runtime_error if an index does not name a batch in the file or if a batch
    // cannot be read.
    std::vector<std::uint32_t> make_batch_counts(
        std::shared_ptr<pod5::FileReader> const & reader,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const & batches)
    {
        std::vector<std::uint32_t> batch_counts(reader->num_read_record_batches(), 0);
        for (auto const & batch_idx : gsl::make_span(batches.data(), batches.shape(0))) {
            // The index comes straight from Python: reject anything outside the table before it
            // is used to read a batch or to write into batch_counts.
            if (batch_idx >= batch_counts.size()) {
                throw std::runtime_error(
                    "Failed to query read batch count: batch index out of range");
            }

            auto read_batch = reader->read_read_record_batch(batch_idx);
            if (!read_batch.ok()) {
                throw std::runtime_error(
                    "Failed to query read batch count: " + read_batch.status().ToString());
            }

            batch_counts[batch_idx] = read_batch->num_rows();
        }
        return batch_counts;
    }

    pod5::AsyncSignalLoader::SamplesMode m_samples_mode;
    // Backing storage for the batch-count span used by the "specific batches" constructor.
    std::vector<std::uint32_t> m_batch_sizes;
    // References to the caller's numpy arrays, held so the spans built over them stay valid.
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> m_batch_counts_ref;
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> m_batch_rows_ref;
    pod5::AsyncSignalLoader m_async_loader;
};

// Thin holder for a shared pod5::FileReader, exposed to Python.
//
// NOTE(review): close() resets `reader` to nullptr and the other members dereference it without
// a null check, so they must not be called after close().
struct Pod5FileReaderPtr {
    std::shared_ptr<pod5::FileReader> reader = nullptr;

    Pod5FileReaderPtr(std::shared_ptr<pod5::FileReader> && reader_) : reader(std::move(reader_)) {}

    pod5::FileLocation get_file_run_info_table_location() const
    {
        return reader->run_info_table_location();
    }

    pod5::FileLocation get_file_read_table_location() const
    {
        return reader->read_table_location();
    }

    pod5::FileLocation get_file_signal_table_location() const
    {
        return reader->signal_table_location();
    }

    std::string get_file_version_pre_migration() const
    {
        return reader->file_version_pre_migration().to_string();
    }

    // Drop this holder's reference to the reader.
    void close() { reader = nullptr; }

    // Search the file for the given read ids and fill in the traversal plan.
    //
    // `read_id_data` is reinterpreted as an array of pod5::Uuid with one entry per row.
    // `batch_counts` must hold at least one entry per read batch in the file and `batch_rows` at
    // least one entry per requested read id; both are written to. Returns the value produced by
    // the reader's search_for_read_ids call. Throws std::runtime_error if any array is too small.
    std::size_t plan_traversal(
        py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> const & read_id_data,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> & batch_counts,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> & batch_rows)
    {
        auto const read_id_count = read_id_data.shape(0);
        auto const requested_ids = static_cast<std::size_t>(read_id_count);
        auto const batch_count = static_cast<std::size_t>(reader->num_read_record_batches());

        // The spans below are built over raw numpy storage with lengths taken from elsewhere, so
        // check that every buffer really is large enough before anything reads or writes it.
        if (static_cast<std::size_t>(read_id_data.size()) < requested_ids * sizeof(pod5::Uuid)) {
            throw std::runtime_error("Read id array is of unexpected size");
        }
        if (static_cast<std::size_t>(batch_counts.size()) < batch_count) {
            throw std::runtime_error("Batch counts array is too small for the file's read batches");
        }
        if (static_cast<std::size_t>(batch_rows.size()) < requested_ids) {
            throw std::runtime_error("Batch rows array is too small for the requested read ids");
        }

        auto search_input = pod5::ReadIdSearchInput(
            gsl::make_span(
                reinterpret_cast<pod5::Uuid const *>(read_id_data.data()), read_id_count));

        POD5_PYTHON_ASSIGN_OR_RAISE(
            auto find_success_count,
            reader->search_for_read_ids(
                search_input,
                gsl::make_span(batch_counts.mutable_data(), reader->num_read_record_batches()),
                gsl::make_span(batch_rows.mutable_data(), read_id_count)));

        return find_success_count;
    }

    // Create a loader over every read in the file.
    // `get_sample_count` is accepted but not used by this function.
    std::shared_ptr<Pod5AsyncSignalLoader> batch_get_signal(bool get_samples, bool get_sample_count)
    {
        return std::make_shared<Pod5AsyncSignalLoader>(
            reader,
            get_samples ? pod5::AsyncSignalLoader::SamplesMode::Samples
                        : pod5::AsyncSignalLoader::SamplesMode::NoSamples);
    }

    // Create a loader restricted to the listed batches.
    // `get_sample_count` is accepted but not used by this function.
    std::shared_ptr<Pod5AsyncSignalLoader> batch_get_signal_batches(
        bool get_samples,
        bool get_sample_count,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batches)
    {
        return std::make_shared<Pod5AsyncSignalLoader>(
            reader,
            get_samples ? pod5::AsyncSignalLoader::SamplesMode::Samples
                        : pod5::AsyncSignalLoader::SamplesMode::NoSamples,
            std::move(batches));
    }

    // Create a loader restricted to specific rows of specific batches.
    // `get_sample_count` is accepted but not used by this function.
    std::shared_ptr<Pod5AsyncSignalLoader> batch_get_signal_selection(
        bool get_samples,
        bool get_sample_count,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batch_counts,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batch_rows)
    {
        return std::make_shared<Pod5AsyncSignalLoader>(
            reader,
            get_samples ? pod5::AsyncSignalLoader::SamplesMode::Samples
                        : pod5::AsyncSignalLoader::SamplesMode::NoSamples,
            std::move(batch_counts),
            std::move(batch_rows));
    }
};

// Open `filename` with default reader options and wrap the resulting reader for Python.
// A failure to open is reported through POD5_PYTHON_ASSIGN_OR_RAISE.
inline Pod5FileReaderPtr open_file(char const * filename)
{
    POD5_PYTHON_ASSIGN_OR_RAISE(auto opened_reader, pod5::open_file_reader(filename, {}));
    return Pod5FileReaderPtr{std::move(opened_reader)};
}

// Call pod5::update_file for `source`'s reader with `dest_filename`, allocating from Arrow's
// default memory pool. A failing status is reported through POD5_PYTHON_RETURN_NOT_OK.
inline void write_updated_file_to_dest(Pod5FileReaderPtr source, char const * dest_filename)
{
    auto * const memory_pool = arrow::default_memory_pool();
    POD5_PYTHON_RETURN_NOT_OK(pod5::update_file(memory_pool, source.reader, dest_filename));
}

// Add a run info record to `w` and return its dictionary index.
//
// The arguments are passed positionally, in declaration order, to the brace-initialised run info
// given to FileWriter::add_run_info. The string and vector arguments are moved from, so the
// caller's objects are left in a moved-from state. Errors are raised via throw_on_error.
inline pod5::RunInfoDictionaryIndex FileWriter_add_run_info(
    pod5::FileWriter & w,
    std::string & acquisition_id,
    std::int64_t acquisition_start_time,
    std::int16_t adc_max,
    std::int16_t adc_min,
    std::vector<std::pair<std::string, std::string>> && context_tags,
    std::string & experiment_name,
    std::string & flow_cell_id,
    std::string & flow_cell_product_code,
    std::string & protocol_name,
    std::string & protocol_run_id,
    std::int64_t protocol_start_time,
    std::string & sample_id,
    std::uint16_t sample_rate,
    std::string & sequencing_kit,
    std::string & sequencer_position,
    std::string & sequencer_position_type,
    std::string & software,
    std::string & system_name,
    std::string & system_type,
    std::vector<std::pair<std::string, std::string>> && tracking_id)
{
    return throw_on_error(w.add_run_info(
        {std::move(acquisition_id),
         acquisition_start_time,
         adc_max,
         adc_min,
         std::move(context_tags),
         std::move(experiment_name),
         std::move(flow_cell_id),
         std::move(flow_cell_product_code),
         std::move(protocol_name),
         std::move(protocol_run_id),
         // Plain integer: moving it would be a no-op, so pass it like the other scalars.
         protocol_start_time,
         std::move(sample_id),
         sample_rate,
         std::move(sequencing_kit),
         std::move(sequencer_position),
         std::move(sequencer_position_type),
         std::move(software),
         std::move(system_name),
         std::move(system_type),
         std::move(tracking_id)}));
}

// Assemble the pod5::ReadData for row `row_id` from the column arrays.
//
// The read id is taken from `read_id_data` reinterpreted as an array of pod5::Uuid; every other
// field is the element at `row_id` of the matching column, in parameter order.
inline pod5::ReadData make_read_data(
    std::size_t row_id,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> const & read_id_data,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const & read_numbers,
    py::array_t<std::uint64_t, py::array::c_style | py::array::forcecast> const & start_samples,
    py::array_t<std::uint16_t, py::array::c_style | py::array::forcecast> const & channels,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> const & wells,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & pore_types,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & calibration_offsets,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & calibration_scales,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & median_befores,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & end_reasons,
    py::array_t<bool, py::array::c_style | py::array::forcecast> const & end_reason_forceds,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & run_infos,
    py::array_t<std::uint64_t, py::array::c_style | py::array::forcecast> const &
        num_minknow_events,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & tracked_scaling_scale,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & tracked_scaling_shift,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & predicted_scaling_scale,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & predicted_scaling_shift,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const &
        num_reads_since_mux_change,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & time_since_mux_change,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & open_pore_level)
{
    // Fetch this row's element from a column.
    auto const cell = [row_id](auto const & column) { return *column.data(row_id); };

    auto const * const uuid_table = reinterpret_cast<pod5::Uuid const *>(read_id_data.data(0));

    return pod5::ReadData{
        uuid_table[row_id],
        cell(read_numbers),
        cell(start_samples),
        cell(channels),
        cell(wells),
        cell(pore_types),
        cell(calibration_offsets),
        cell(calibration_scales),
        cell(median_befores),
        cell(end_reasons),
        cell(end_reason_forceds),
        cell(run_infos),
        cell(num_minknow_events),
        cell(tracked_scaling_scale),
        cell(tracked_scaling_shift),
        cell(predicted_scaling_scale),
        cell(predicted_scaling_shift),
        cell(num_reads_since_mux_change),
        cell(time_since_mux_change),
        cell(open_pore_level)};
}

// Write `count` complete reads, with uncompressed signal, to `w`.
//
// Row i of every column array describes read i, and the i-th entry of `signal_ptrs` is cast to an
// int16 array holding that read's signal. Throws std::runtime_error if the read id array does not
// have 16 columns, has fewer than `count` rows, or if `signal_ptrs` has fewer than `count`
// entries; writer errors are raised via throw_on_error.
inline void FileWriter_add_reads(
    pod5::FileWriter & w,
    std::size_t count,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> const & read_id_data,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const & read_numbers,
    py::array_t<std::uint64_t, py::array::c_style | py::array::forcecast> const & start_samples,
    py::array_t<std::uint16_t, py::array::c_style | py::array::forcecast> const & channels,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> const & wells,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & pore_types,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & calibration_offsets,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & calibration_scales,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & median_befores,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & end_reasons,
    py::array_t<bool, py::array::c_style | py::array::forcecast> const & end_reason_forceds,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & run_infos,
    py::array_t<std::uint64_t, py::array::c_style | py::array::forcecast> const &
        num_minknow_events,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & tracked_scaling_scales,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & tracked_scaling_shifts,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & predicted_scaling_scales,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & predicted_scaling_shifts,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const &
        num_reads_since_mux_changes,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & time_since_mux_changes,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & open_pore_levels,
    py::list signal_ptrs)
{
    if (read_id_data.shape(1) != 16) {
        throw std::runtime_error("Read id array is of unexpected size");
    }
    // The read ids are indexed through a raw pointer when each read is assembled, so make sure a
    // row exists for every read that will be written.
    if (static_cast<std::size_t>(read_id_data.shape(0)) < count) {
        throw std::runtime_error("Read id array contains fewer read ids than requested");
    }

    auto signal_it = signal_ptrs.begin();
    for (std::size_t i = 0; i < count; ++i, ++signal_it) {
        if (signal_it == signal_ptrs.end()) {
            throw std::runtime_error("Missing signal data");
        }
        // `signal` keeps the (possibly converted) array alive while the span is in use.
        auto signal =
            signal_it->cast<py::array_t<std::int16_t, py::array::c_style | py::array::forcecast>>();
        auto signal_span = gsl::make_span(signal.data(), signal.size());

        auto read_data = make_read_data(
            i,
            read_id_data,
            read_numbers,
            start_samples,
            channels,
            wells,
            pore_types,
            calibration_offsets,
            calibration_scales,
            median_befores,
            end_reasons,
            end_reason_forceds,
            run_infos,
            num_minknow_events,
            tracked_scaling_scales,
            tracked_scaling_shifts,
            predicted_scaling_scales,
            predicted_scaling_shifts,
            num_reads_since_mux_changes,
            time_since_mux_changes,
            open_pore_levels);

        throw_on_error(w.add_complete_read(read_data, signal_span));
    }
}

// Write `count` reads whose signal has already been compressed into chunks.
//
// Read i owns the next `signal_chunk_counts[i]` entries of `compressed_signal_ptrs` and of
// `sample_counts`; both are consumed sequentially across reads. Each chunk is added to the signal
// table first, then the read is added with the resulting signal rows and the summed sample count.
// Throws std::runtime_error if the read id array does not have 16 columns or has fewer than
// `count` rows, or if the chunk list or `sample_counts` runs out early; writer errors are raised
// via throw_on_error.
inline void FileWriter_add_reads_pre_compressed(
    pod5::FileWriter & w,
    std::size_t count,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> const & read_id_data,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const & read_numbers,
    py::array_t<std::uint64_t, py::array::c_style | py::array::forcecast> const & start_samples,
    py::array_t<std::uint16_t, py::array::c_style | py::array::forcecast> const & channels,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> const & wells,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & pore_types,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & calibration_offsets,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & calibration_scales,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & median_befores,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & end_reasons,
    py::array_t<bool, py::array::c_style | py::array::forcecast> const & end_reason_forceds,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & run_infos,
    py::array_t<std::uint64_t, py::array::c_style | py::array::forcecast> const &
        num_minknow_events,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & tracked_scaling_scales,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & tracked_scaling_shifts,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & predicted_scaling_scales,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & predicted_scaling_shifts,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const &
        num_reads_since_mux_changes,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & time_since_mux_changes,
    py::array_t<float, py::array::c_style | py::array::forcecast> const & open_pore_levels,
    py::list compressed_signal_ptrs,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const & sample_counts,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> const &
        signal_chunk_counts)
{
    if (read_id_data.shape(1) != 16) {
        throw std::runtime_error("Read id array is of unexpected size");
    }
    // The read ids are indexed through a raw pointer below, so make sure a row exists for every
    // read that will be written.
    if (static_cast<std::size_t>(read_id_data.shape(0)) < count) {
        throw std::runtime_error("Read id array contains fewer read ids than requested");
    }

    auto read_ids = reinterpret_cast<pod5::Uuid const *>(read_id_data.data(0));
    auto compressed_signal_it = compressed_signal_ptrs.begin();
    auto sample_counts_it = sample_counts.data();
    // One-past-the-end of the sample count storage, used to stop the raw pointer overrunning it.
    auto const sample_counts_end = sample_counts.data() + sample_counts.size();
    for (std::size_t i = 0; i < count; ++i) {
        auto const read_id = read_ids[i];

        auto const signal_chunk_count = *signal_chunk_counts.data(i);
        std::uint64_t signal_duration_count = 0;
        std::vector<std::uint64_t> signal_rows(signal_chunk_count);
        for (std::size_t signal_chunk_idx = 0; signal_chunk_idx < signal_chunk_count;
             ++signal_chunk_idx)
        {
            if (compressed_signal_it == compressed_signal_ptrs.end()) {
                throw std::runtime_error("Missing signal data");
            }
            if (sample_counts_it == sample_counts_end) {
                throw std::runtime_error("Missing sample count data");
            }
            // `compressed_signal` keeps the (possibly converted) array alive while the span is
            // in use.
            auto compressed_signal =
                compressed_signal_it
                    ->cast<py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast>>();
            auto compressed_signal_span =
                gsl::make_span(compressed_signal.data(), compressed_signal.size());

            auto signal_row = throw_on_error(
                w.add_pre_compressed_signal(read_id, compressed_signal_span, *sample_counts_it));
            signal_rows[signal_chunk_idx] = signal_row;

            signal_duration_count += *sample_counts_it;
            ++compressed_signal_it;
            ++sample_counts_it;
        }

        auto read_data = make_read_data(
            i,
            read_id_data,
            read_numbers,
            start_samples,
            channels,
            wells,
            pore_types,
            calibration_offsets,
            calibration_scales,
            median_befores,
            end_reasons,
            end_reason_forceds,
            run_infos,
            num_minknow_events,
            tracked_scaling_scales,
            tracked_scaling_shifts,
            predicted_scaling_scales,
            predicted_scaling_shifts,
            num_reads_since_mux_changes,
            time_since_mux_changes,
            open_pore_levels);

        throw_on_error(w.add_complete_read(read_data, signal_rows, signal_duration_count));
    }
}

// Decompress `compressed_signal` into the caller-provided `signal_out` buffer.
//
// Both spans cover shape(0) elements of their array; scratch memory comes from Arrow's system
// memory pool. Errors are raised via throw_on_error.
inline void decompress_signal_wrapper(
    py::array_t<uint8_t, py::array::c_style | py::array::forcecast> const & compressed_signal,
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> & signal_out)
{
    auto compressed_bytes = gsl::make_span(compressed_signal.data(0), compressed_signal.shape(0));
    auto destination = gsl::make_span(signal_out.mutable_data(0), signal_out.shape(0));

    throw_on_error(
        pod5::decompress_signal(compressed_bytes, arrow::system_memory_pool(), destination));
}

// Compress `signal` into the caller-provided `compressed_signal_out` buffer and return the value
// produced by pod5::compress_signal.
//
// Both spans cover shape(0) elements of their array; scratch memory comes from Arrow's system
// memory pool. Errors are raised via throw_on_error.
inline std::size_t compress_signal_wrapper(
    py::array_t<std::int16_t, py::array::c_style | py::array::forcecast> const & signal,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> & compressed_signal_out)
{
    auto samples = gsl::make_span(signal.data(), signal.shape(0));
    auto destination =
        gsl::make_span(compressed_signal_out.mutable_data(), compressed_signal_out.shape(0));

    return throw_on_error(
        pod5::compress_signal(samples, arrow::system_memory_pool(), destination));
}

inline std::size_t vbz_compressed_signal_max_size(std::size_t sample_count)
{
    POD5_PYTHON_ASSIGN_OR_RAISE(
        std::size_t const max_size, pod5::compressed_signal_max_size(sample_count));
    return max_size;
}

// Parse an iterable of UUID strings into `read_id_data_out`, viewed as an array of pod5::Uuid.
//
// Strings that fail to parse are skipped, so the returned count of ids written can be smaller
// than the number of inputs. Throws std::runtime_error if an input is reached while the output
// already holds shape(0) ids.
inline std::size_t load_read_id_iterable(
    py::iterable const & read_ids_str,
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> & read_id_data_out)
{
    auto * const uuids_out = reinterpret_cast<pod5::Uuid *>(read_id_data_out.mutable_data());
    auto const capacity = static_cast<std::size_t>(read_id_data_out.shape(0));

    std::size_t written = 0;
    std::string text;  // reused for every element
    for (auto & item : read_ids_str) {
        if (written >= capacity) {
            throw std::runtime_error("Too many input uuids for output container");
        }

        text = item.cast<py::str>();
        auto const parsed = pod5::Uuid::from_string(text);
        if (!parsed) {
            // Invalid id: skip it. The caller sees a shorter count than it supplied.
            continue;
        }
        uuids_out[written] = *parsed;
        ++written;
    }

    return written;
}

// Format packed 16-byte read ids as a list of Python strings.
//
// The array is consumed 16 bytes at a time; each id is formatted by pod5_format_read_id into a
// 37 char buffer, of which the first 36 characters become the string. Throws std::runtime_error
// if the total byte count is not a multiple of 16.
inline py::list format_read_id_to_str(
    py::array_t<std::uint8_t, py::array::c_style | py::array::forcecast> & read_id_data_out)
{
    auto const total_size = read_id_data_out.size();
    if (total_size % 16 != 0) {
        throw std::runtime_error(
            "Unexpected amount of data for read id - expected data to align to 16 bytes.");
    }

    std::size_t const id_count = total_size / 16;

    py::list formatted;
    std::array<char, 37> text_buffer;
    for (std::size_t offset = 0; offset < id_count * 16; offset += 16) {
        pod5_format_read_id(read_id_data_out.data() + offset, text_buffer.data());
        // The final buffer element is left out of the Python string.
        formatted.append(py::str(text_buffer.data(), text_buffer.size() - 1));
    }

    return formatted;
}


================================================
FILE: c++/pod5_format_pybind/bindings.cpp
================================================
#include "api.h"
#include "pod5_format/c_api.h"
#include "repack/repack_output.h"
#include "repack/repacker.h"
#include "subset.h"

// Definition of the `pod5_format_pybind` Python extension module.
//
// Registers the enums, classes and free functions below on the module object `m`.
// The bound callables (FileWriter_add_reads, create_file, open_file, ...) are
// defined outside this block.
PYBIND11_MODULE(pod5_format_pybind, m)
{
    using namespace pod5;
    // Initialise the pod5 C API before any binding is used.
    pod5_init();

    m.doc() = "POD5 Format Raw Bindings";

    // Signal compression types; export_values() also exposes the enumerators
    // directly on the module.
    py::enum_<SignalType>(m, "SignalType", py::arithmetic(), "SignalType enum")
        .value("UncompressedSignal", SignalType::UncompressedSignal, "Signal is not compressed")
        .value("VbzSignal", SignalType::VbzSignal, "Signal is compressed using vbz")
        .export_values();

    // Writer options, exposed as read/write properties backed by getter/setter pairs.
    // Note the Python property `signal_compression_type` maps onto the C++
    // signal_type / set_signal_type accessors.
    py::class_<FileWriterOptions>(m, "FileWriterOptions")
        .def(py::init<>())
        .def_property(
            "max_signal_chunk_size",
            &FileWriterOptions::max_signal_chunk_size,
            &FileWriterOptions::set_max_signal_chunk_size)
        .def_property(
            "signal_table_batch_size",
            &FileWriterOptions::signal_table_batch_size,
            &FileWriterOptions::set_signal_table_batch_size)
        .def_property(
            "read_table_batch_size",
            &FileWriterOptions::read_table_batch_size,
            &FileWriterOptions::set_read_table_batch_size)
        .def_property(
            "signal_compression_type",
            &FileWriterOptions::signal_type,
            &FileWriterOptions::set_signal_type);

    // File writer. No constructor is bound here; instances are held by shared_ptr.
    // The lambdas pass results through throw_on_error.
    py::class_<FileWriter, std::shared_ptr<FileWriter>>(m, "FileWriter")
        .def("close", [](pod5::FileWriter & w) { throw_on_error(w.close()); })
        .def(
            "add_pore",
            [](pod5::FileWriter & w, std::string pore_type) {
                return throw_on_error(w.add_pore_type(std::move(pore_type)));
            })
        .def(
            "add_end_reason",
            // `name` is the integer value of a pod5::ReadEndReason enumerator.
            [](pod5::FileWriter & w, int name) {
                return throw_on_error(w.lookup_end_reason((pod5::ReadEndReason)name));
            })
        .def("add_run_info", FileWriter_add_run_info)
        .def("add_reads", FileWriter_add_reads)
        .def("add_reads_pre_compressed", FileWriter_add_reads_pre_compressed);

    // Read-only view of a pod5::FileLocation. The Python attribute `length`
    // maps onto the C++ member `size`.
    py::class_<pod5::FileLocation>(m, "EmbeddedFileData")
        .def_readonly("file_path", &pod5::FileLocation::file_path)
        .def_readonly("offset", &pod5::FileLocation::offset)
        .def_readonly("length", &pod5::FileLocation::size);

    py::class_<Pod5AsyncSignalLoader, std::shared_ptr<Pod5AsyncSignalLoader>>(
        m, "Pod5AsyncSignalLoader")
        .def("release_next_batch", &Pod5AsyncSignalLoader::release_next_batch);

    py::class_<Pod5SignalCacheBatch, std::shared_ptr<Pod5SignalCacheBatch>>(
        m, "Pod5SignalCacheBatch")
        .def_property_readonly("batch_index", &Pod5SignalCacheBatch::batch_index)
        .def_property_readonly("sample_count", &Pod5SignalCacheBatch::sample_count)
        .def_property_readonly("samples", &Pod5SignalCacheBatch::samples);

    // File reader handle. No constructor is bound here.
    py::class_<Pod5FileReaderPtr>(m, "Pod5FileReader")
        .def(
            "get_file_run_info_table_location",
            &Pod5FileReaderPtr::get_file_run_info_table_location)
        .def("get_file_read_table_location", &Pod5FileReaderPtr::get_file_read_table_location)
        .def("get_file_signal_table_location", &Pod5FileReaderPtr::get_file_signal_table_location)
        .def("get_file_version_pre_migration", &Pod5FileReaderPtr::get_file_version_pre_migration)
        .def("plan_traversal", &Pod5FileReaderPtr::plan_traversal)
        .def("batch_get_signal", &Pod5FileReaderPtr::batch_get_signal)
        .def("batch_get_signal_selection", &Pod5FileReaderPtr::batch_get_signal_selection)
        .def("batch_get_signal_batches", &Pod5FileReaderPtr::batch_get_signal_batches)
        .def("close", &Pod5FileReaderPtr::close);

    // Errors API
    m.def("get_error_string", &pod5_get_error_string, "Get the most recent error as a string");

    // Creating files
    // `options` is optional and defaults to nullptr.
    m.def(
        "create_file",
        &create_file,
        "Create a POD5 file for writing",
        py::arg("filename"),
        py::arg("writer_name"),
        py::arg("options") = nullptr);

    // Opening files
    m.def("open_file", &open_file, "Open a POD5 file for reading");

    // Recovering files
    // Option and result structs are exposed with default constructors and
    // read/write attributes.
    py::class_<RecoverFileOptions>(m, "RecoverFileOptions")
        .def(py::init<>())
        .def_readwrite("file_writer_options", &RecoverFileOptions::file_writer_options)
        .def_readwrite("cleanup", &RecoverFileOptions::cleanup);
    py::class_<RecoveredRowCounts>(m, "RecoveredRowCounts")
        .def(py::init<>())
        .def_readwrite("signal", &RecoveredRowCounts::signal)
        .def_readwrite("run_info", &RecoveredRowCounts::run_info)
        .def_readwrite("reads", &RecoveredRowCounts::reads);
    py::class_<CleanupError>(m, "CleanupError")
        .def(py::init<>())
        .def_readwrite("file_path", &CleanupError::file_path)
        .def_readwrite("description", &CleanupError::description);
    py::class_<RecoveryDetails>(m, "RecoveryDetails")
        .def(py::init<>())
        .def_readwrite("row_counts", &RecoveryDetails::row_counts)
        .def_readwrite("cleanup_errors", &RecoveryDetails::cleanup_errors);
    // `::recover_file` is the global-namespace wrapper; the explicit qualification
    // matters because of the `using namespace pod5` above.
    m.def(
        "recover_file",
        &::recover_file,
        "Recover a POD5 file which was not closed correctly",
        py::arg("src_filename"),
        py::arg("dest_filename"),
        py::arg("options") = nullptr);

    m.def(
        "update_file",
        &write_updated_file_to_dest,
        "Update a POD5 file to the latest writer format");

    // Signal API
    m.def("decompress_signal", &decompress_signal_wrapper, "Decompress a numpy array of signal");
    m.def("compress_signal", &compress_signal_wrapper, "Compress a numpy array of signal");
    m.def("vbz_compressed_signal_max_size", &vbz_compressed_signal_max_size);

    // Repacker API
    // Pod5RepackerOutput is registered without methods or a constructor; it is
    // the type passed to and from the Repacker methods below.
    py::class_<repack::Pod5RepackerOutput, std::shared_ptr<repack::Pod5RepackerOutput>>(
        m, "Pod5RepackerOutput");

    py::class_<repack::Pod5Repacker, std::shared_ptr<repack::Pod5Repacker>>(m, "Repacker")
        .def(py::init<>())
        .def("add_output", &repack::Pod5Repacker::add_output)
        .def("set_output_finished", &repack::Pod5Repacker::set_output_finished)
        .def("add_all_reads_to_output", &repack::Pod5Repacker::add_all_reads_to_output)
        .def("add_selected_reads_to_output", &repack::Pod5Repacker::py_add_selected_reads_to_output)
        .def("finish", &repack::Pod5Repacker::finish)
        .def_property_readonly("is_complete", &repack::Pod5Repacker::is_complete)
        .def_property_readonly(
            "currently_open_file_reader_count",
            &repack::Pod5Repacker::currently_open_file_reader_count)
        .def_property_readonly("reads_completed", &repack::Pod5Repacker::reads_completed);

    // Util API
    m.def(
        "load_read_id_iterable",
        &load_read_id_iterable,
        "Load an iterable of read ids into a numpy array of data");
    m.def("format_read_id_to_str", &format_read_id_to_str, "Format an array of read ids to string");

    m.def(
        "subset_pod5s_with_mapping",
        &subset_pod5s_with_mapping,
        "Subset pod5 files given a mapping");
}


================================================
FILE: c++/pod5_format_pybind/build_wheel.cmake
================================================

# Stage the prebuilt extension library and license files into the python project
# directory, then build the lib-pod5 wheel with `pip wheel`.
#
# Variables read by this script (all must be provided by the caller):
#   PYTHON_EXECUTABLE       python interpreter used to run pip
#   PYTHON_PROJECT_DIR      python project directory the wheel is built from
#   PYBIND_INPUT_LIB        prebuilt library copied into src/lib_pod5
#   POD5_CONAN_LICENSES     optional directory of licenses, copied if it exists
#   POD5_CXX_LICENSES_SRC   list of license files to copy
#   POD5_CXX_LICENSES_DST   list of destination names, paired with the list above
#   WHEEL_OUTPUT_DIR        directory the wheel(s) are written to
message("Building python lib-pod5 wheel using ${PYTHON_EXECUTABLE}")
message("  project dir ${PYTHON_PROJECT_DIR}")
message("  with lib ${PYBIND_INPUT_LIB}")
message("  with conan licenses ${POD5_CONAN_LICENSES}")
message("  with c++ licenses ${POD5_CXX_LICENSES_SRC}")
message("  into ${WHEEL_OUTPUT_DIR}")
message("  using: ${PYTHON_EXECUTABLE} -m pip wheel . --wheel-dir ${WHEEL_OUTPUT_DIR}")

# Copy the prebuilt lib into the wheel src.
file(COPY "${PYBIND_INPUT_LIB}" DESTINATION "${PYTHON_PROJECT_DIR}/src/lib_pod5")

# Copy the licenses into the wheel src.
# Note: the trailing / on src is important since it tells cmake to copy only the contents.
if(EXISTS "${POD5_CONAN_LICENSES}")
    file(INSTALL "${POD5_CONAN_LICENSES}/" DESTINATION "${PYTHON_PROJECT_DIR}/licenses")
endif()

foreach(license_src license_dst IN ZIP_LISTS POD5_CXX_LICENSES_SRC POD5_CXX_LICENSES_DST)
    # file(COPY_FILE) does not create missing parent directories. The licenses
    # directory may not exist yet when the conan licenses above were skipped, or
    # when the destination name contains a subdirectory, so create it first.
    set(license_dst_path "${PYTHON_PROJECT_DIR}/licenses/${license_dst}")
    get_filename_component(license_dst_dir "${license_dst_path}" DIRECTORY)
    file(MAKE_DIRECTORY "${license_dst_dir}")
    file(COPY_FILE "${license_src}" "${license_dst_path}")
endforeach()

# stdout and stderr are merged into one variable so the full pip log can be
# reported if the build fails.
execute_process(
    COMMAND ${PYTHON_EXECUTABLE} -m pip wheel . --wheel-dir ${WHEEL_OUTPUT_DIR}
    WORKING_DIRECTORY "${PYTHON_PROJECT_DIR}/"
    RESULT_VARIABLE exit_code
    OUTPUT_VARIABLE output
    ERROR_VARIABLE output
)

if (NOT exit_code EQUAL 0)
    message(FATAL_ERROR "Could not generate wheel: ${output}")
endif()

# Report every wheel present in the output directory.
file(GLOB pod5_wheel_names "${WHEEL_OUTPUT_DIR}/*.whl")
foreach(wheel ${pod5_wheel_names})
    message("Built wheel ${wheel}")
endforeach()


================================================
FILE: c++/pod5_format_pybind/repack/repack_functions.h
================================================
#pragma once

#include "pod5_format/internal/tracing/tracing.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/signal_builder.h"
#include "pod5_format/signal_table_schema.h"
#include "pod5_format/uuid.h"
#include "repack_utils.h"

#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/array/builder_binary.h>

#include <numeric>
#include <unordered_set>

namespace repack {

// Result of read_read_data: the read table rows pulled from one source batch, plus
// the flattened list of signal table rows those reads refer to.
struct ReadReadData {
    // Source file the rows were read from.
    std::shared_ptr<pod5::FileReader> input;
    // One entry per selected read table row.
    std::vector<pod5::ReadData> reads;
    // Per read: the `num_samples` value of the source row.
    std::vector<std::size_t> signal_durations;
    // Per read: how many entries of `signal_rows` belong to it.
    std::vector<std::size_t> signal_row_sizes;

    // Per signal row: the read id of the read owning it (parallel to `signal_rows`).
    std::vector<pod5::Uuid> signal_rows_read_ids;
    // Signal table row indices in the source file, concatenated in read order.
    std::vector<std::uint64_t> signal_rows;
};

// Load the selected rows of one read table batch from the source file.
//
// \param reads_table_cache Cache used to translate the source pore type and run info
//                          dictionary indices into destination indices.
// \param in_batch          Identifies the source file, the batch index and the rows to
//                          read. An empty `batch_rows` selects every row in the batch.
//                          `batch_rows` is moved out of `in_batch`.
// \return The read data and flattened signal row list for the selected rows, or the
//         first error reported while reading the batch or resolving dictionary entries.
//
// The end reason index is copied through unchanged; only pore type and run info
// indices are remapped via the cache.
arrow::Result<ReadReadData> read_read_data(
    ReadsTableDictionaryThreadCache & reads_table_cache,
    states::unread_read_table_rows && in_batch)
{
    POD5_TRACE_FUNCTION();

    auto const & source_file = in_batch.input;
    ARROW_ASSIGN_OR_RAISE(
        auto source_read_table_batch, source_file->read_read_record_batch(in_batch.batch_index));

    ARROW_ASSIGN_OR_RAISE(auto columns, source_read_table_batch.columns());

    // Dictionary columns: grab the raw index arrays so per-row lookups are plain integers.
    auto const & pore_type_columns = columns.pore_type->indices();
    auto const & source_reads_pore_type_column =
        static_cast<arrow::Int16Array const &>(*pore_type_columns);
    auto const & end_reason_columns = columns.end_reason->indices();
    auto const & source_reads_end_reason_column =
        static_cast<arrow::Int16Array const &>(*end_reason_columns);
    auto const & run_info_columns = columns.run_info->indices();
    auto const & source_reads_run_info_column =
        static_cast<arrow::Int16Array const &>(*run_info_columns);
    auto source_reads_signal_column = source_read_table_batch.signal_column();

    // An empty selection means "all rows in the batch".
    auto batch_rows = std::move(in_batch.batch_rows);
    if (batch_rows.empty()) {
        auto const source_batch_row_count = source_read_table_batch.num_rows();
        batch_rows.resize(source_batch_row_count);
        std::iota(batch_rows.begin(), batch_rows.end(), 0);
    }

    ReadReadData result;
    result.input = source_file;
    // Every per-read vector receives exactly one entry per selected row. The signal row
    // vectors receive one entry per signal row, so this is only an initial estimate.
    result.reads.reserve(batch_rows.size());
    result.signal_durations.reserve(batch_rows.size());
    result.signal_row_sizes.reserve(batch_rows.size());
    result.signal_rows.reserve(batch_rows.size());
    result.signal_rows_read_ids.reserve(batch_rows.size());
    for (auto const batch_row : batch_rows) {
        // Find the read params
        auto const & read_id = columns.read_id->Value(batch_row);
        auto const & read_number = columns.read_number->Value(batch_row);
        auto const & start_sample = columns.start_sample->Value(batch_row);
        auto const & channel = columns.channel->Value(batch_row);
        auto const & well = columns.well->Value(batch_row);
        auto const & calibration_offset = columns.calibration_offset->Value(batch_row);
        auto const & calibration_scale = columns.calibration_scale->Value(batch_row);
        auto const & median_before = columns.median_before->Value(batch_row);
        auto const & end_reason_forced = columns.end_reason_forced->Value(batch_row);
        auto const & num_minknow_events = columns.num_minknow_events->Value(batch_row);
        auto const & tracked_scaling_scale = columns.tracked_scaling_scale->Value(batch_row);
        auto const & tracked_scaling_shift = columns.tracked_scaling_shift->Value(batch_row);
        auto const & predicted_scaling_scale = columns.predicted_scaling_scale->Value(batch_row);
        auto const & predicted_scaling_shift = columns.predicted_scaling_shift->Value(batch_row);
        auto const & num_reads_since_mux_change =
            columns.num_reads_since_mux_change->Value(batch_row);
        auto const & time_since_mux_change = columns.time_since_mux_change->Value(batch_row);
        auto const & open_pore_level = columns.open_pore_level->Value(batch_row);
        auto const & num_samples = columns.num_samples->Value(batch_row);

        auto const & pore_type_index = source_reads_pore_type_column.Value(batch_row);
        auto const & end_reason_index = source_reads_end_reason_column.Value(batch_row);
        auto const & run_info_index = source_reads_run_info_column.Value(batch_row);

        // Translate source dictionary indices into destination indices.
        ARROW_ASSIGN_OR_RAISE(
            auto dest_pore_index,
            reads_table_cache.find_pore_index(
                source_file, source_read_table_batch, pore_type_index));
        ARROW_ASSIGN_OR_RAISE(
            auto dest_run_info_index,
            reads_table_cache.find_run_info_index(
                source_file, source_read_table_batch, run_info_index));

        result.reads.emplace_back(
            read_id,
            read_number,
            start_sample,
            channel,
            well,
            dest_pore_index,
            calibration_offset,
            calibration_scale,
            median_before,
            end_reason_index,
            end_reason_forced,
            dest_run_info_index,
            num_minknow_events,
            tracked_scaling_scale,
            tracked_scaling_shift,
            predicted_scaling_scale,
            predicted_scaling_shift,
            num_reads_since_mux_change,
            time_since_mux_change,
            open_pore_level);
        result.signal_durations.emplace_back(num_samples);

        // Flatten this read's signal row list onto the end of the shared vectors.
        auto const signal_rows = std::static_pointer_cast<arrow::UInt64Array>(
            source_reads_signal_column->value_slice(batch_row));
        auto const signal_rows_span =
            gsl::make_span(signal_rows->raw_values(), signal_rows->length());

        result.signal_rows.insert(
            result.signal_rows.end(), signal_rows_span.begin(), signal_rows_span.end());
        for (std::size_t i = 0; i < signal_rows_span.size(); ++i) {
            result.signal_rows_read_ids.emplace_back(read_id);
        }
        result.signal_row_sizes.emplace_back(signal_rows_span.size());
    }
    return result;
}

// Copy one signal table row from the source file into the output builders.
//
// \param source_file             File to read the signal row from.
// \param input_compression_type  Signal type of the source file.
// \param abs_signal_row          Signal table row index in the source file.
// \param read_id                 Read id appended alongside the signal.
// \param output_compression_type Signal type of the destination.
// \param read_id_builder         Receives the read id.
// \param signal_builder          Receives the signal data.
// \param samples_builder         Receives the sample count of the row.
// \param pool                    Memory pool used when the signal has to be re-encoded.
// \return OK on success, otherwise the first error from the reader or a builder.
//
// When both files use vbz the compressed bytes are copied as-is; otherwise the
// samples are extracted and appended through the destination builder.
arrow::Status read_signal(
    std::shared_ptr<pod5::FileReader> const & source_file,
    pod5::SignalType input_compression_type,
    std::uint64_t abs_signal_row,
    pod5::Uuid read_id,
    pod5::SignalType output_compression_type,
    arrow::FixedSizeBinaryBuilder & read_id_builder,
    pod5::SignalBuilderVariant & signal_builder,
    arrow::UInt32Builder & samples_builder,
    arrow::MemoryPool * pool)
{
    auto signal_rows_span = gsl::make_span(&abs_signal_row, 1);

    // If we're using the same compression type in both files, just copy compressed:
    if (input_compression_type == output_compression_type
        && output_compression_type == pod5::SignalType::VbzSignal)
    {
        std::vector<uint32_t> sample_counts;
        ARROW_ASSIGN_OR_RAISE(
            auto extracted_signal,
            source_file->extract_samples_inplace(signal_rows_span, sample_counts));

        // Checked at runtime (not only via assert) because front() on an empty
        // container would be undefined behaviour in release builds.
        if (extracted_signal.size() != 1 || sample_counts.size() != extracted_signal.size()) {
            return arrow::Status::Invalid(
                "Expected exactly one extracted signal row, found ",
                extracted_signal.size(),
                " rows and ",
                sample_counts.size(),
                " sample counts");
        }
        auto signal_span =
            gsl::make_span(extracted_signal.front()->data(), extracted_signal.front()->size());

        ARROW_RETURN_NOT_OK(read_id_builder.Append(read_id.data()));
        ARROW_RETURN_NOT_OK(
            std::visit(pod5::visitors::append_pre_compressed_signal{signal_span}, signal_builder));
        ARROW_RETURN_NOT_OK(samples_builder.Append(sample_counts.front()));
    } else {
        // Find the sample count of the requested signal row:
        ARROW_ASSIGN_OR_RAISE(
            auto sample_count, source_file->extract_sample_count(signal_rows_span));

        std::vector<std::int16_t> signal(sample_count);
        auto signal_buffer_span = gsl::make_span(signal);
        ARROW_RETURN_NOT_OK(source_file->extract_samples(signal_rows_span, signal_buffer_span));

        ARROW_RETURN_NOT_OK(read_id_builder.Append(read_id.data()));
        ARROW_RETURN_NOT_OK(
            std::visit(pod5::visitors::append_signal{signal_buffer_span, pool}, signal_builder));
        ARROW_RETURN_NOT_OK(samples_builder.Append(sample_count));
    }
    return arrow::Status::OK();
}

// Result of request_signal_reads.
struct RequestedSignalReads {
    // Signal batches that reached the requested batch size.
    std::vector<states::shared_variant> complete_requests;
    // The batch still being filled when the input ran out; null when the last
    // batch was completed exactly.
    std::shared_ptr<states::read_split_signal_table_batch_rows> partial_request;
};

// Read the given signal rows from the source file and pack them into output signal
// batches of at most `signal_batch_size` rows.
//
// \param source_file             File the signal rows are read from.
// \param output_compression_type Signal type used by the destination builders.
// \param signal_batch_size       Maximum number of rows per output signal batch.
// \param read_ids                Read id of each signal row (parallel to `signal_rows`).
// \param signal_rows             Signal table row indices in the source file.
// \param partial_request         Partially filled batch from a previous call, or null.
//                                New rows are appended to it before a new batch starts.
// \param dest_read_table_rows    Read table rows whose signal indices will be patched
//                                once the signal rows have been written.
// \param pool                    Memory pool for the builders.
// \return The batches that became full and the batch left partially filled (if any),
//         or an error if a signal row could not be read or the batch size is zero
//         while rows are pending.
arrow::Result<RequestedSignalReads> request_signal_reads(
    std::shared_ptr<pod5::FileReader> const & source_file,
    pod5::SignalType output_compression_type,
    std::size_t signal_batch_size,
    std::vector<pod5::Uuid> read_ids,
    std::vector<std::uint64_t> signal_rows,
    std::shared_ptr<states::read_split_signal_table_batch_rows> const & partial_request,
    std::shared_ptr<states::read_read_table_rows_no_signal> const & dest_read_table_rows,
    arrow::MemoryPool * pool)
{
    POD5_TRACE_FUNCTION();

    auto const input_signal_type = source_file->signal_type();

    assert(read_ids.size() == signal_rows.size());

    RequestedSignalReads result;
    auto next_request = partial_request;

    assert(signal_rows.size() == dest_read_table_rows->signal_row_indices.size());

    // A zero batch size can never make progress: each pass would write nothing and
    // queue an empty "complete" batch forever.
    if (signal_batch_size == 0 && !signal_rows.empty()) {
        return arrow::Status::Invalid("Signal table batch size must be greater than zero");
    }

    std::size_t signal_rows_position = 0;
    while (signal_rows_position < signal_rows.size()) {
        if (!next_request) {
            ARROW_ASSIGN_OR_RAISE(
                auto signal_builder, pod5::make_signal_builder(output_compression_type, pool));
            next_request = std::make_shared<states::read_split_signal_table_batch_rows>(
                std::move(signal_builder), pool);
            next_request->patch_rows.reserve(signal_batch_size);
        }
        // Fill the current batch with as many of the remaining rows as will fit.
        auto to_write = std::min(
            signal_rows.size() - signal_rows_position,
            signal_batch_size - next_request->patch_rows.size());

        for (std::size_t i = 0; i < to_write; ++i) {
            auto const dest_batch_row_index = signal_rows_position + i;
            assert(dest_batch_row_index < signal_rows.size());
            assert(dest_batch_row_index < dest_read_table_rows->signal_row_indices.size());

            ARROW_RETURN_NOT_OK(read_signal(
                source_file,
                input_signal_type,
                signal_rows[dest_batch_row_index],
                read_ids[dest_batch_row_index],
                output_compression_type,
                *next_request->read_id_builder,
                next_request->signal_builder,
                next_request->samples_builder,
                pool));

            // Remember which read table slot must receive this row's final index.
            next_request->patch_rows.emplace_back(dest_read_table_rows, dest_batch_row_index);
        }
        signal_rows_position += to_write;

        assert(next_request->row_count() <= signal_batch_size);
        if (next_request->row_count() >= signal_batch_size) {
            result.complete_requests.emplace_back(std::move(next_request));
            next_request.reset();
        }
    }

    result.partial_request = next_request;
    return result;
}

// Result of read_signal_data: a finished signal batch ready to be handed to the writer.
struct ReadSignal {
    // Number of rows in the batch.
    std::size_t row_count;
    // Copied from the source batch's `final_batch` flag.
    bool final_batch;
    // Finished arrays, positioned using the indices of pod5::SignalTableSchemaDescription.
    std::vector<std::shared_ptr<arrow::Array>> columns;
};

// Finish the builders of a signal batch and collect the resulting arrays.
//
// The row count and final-batch flag are captured before any builder is finished.
// The three columns are placed at the positions given by a default-constructed
// pod5::SignalTableSchemaDescription.
//
// Returns the finished batch, or the first error reported by a builder.
arrow::Result<ReadSignal> read_signal_data(states::read_split_signal_table_batch_rows & signal_rows)
{
    POD5_TRACE_FUNCTION();

    pod5::SignalTableSchemaDescription column_indices;

    ReadSignal finished_batch;
    finished_batch.final_batch = signal_rows.final_batch;
    finished_batch.row_count = signal_rows.row_count();
    // Three null slots: read id, signal and samples.
    finished_batch.columns.resize(3);

    auto & read_id_column = finished_batch.columns[column_indices.read_id];
    ARROW_RETURN_NOT_OK(signal_rows.read_id_builder->Finish(&read_id_column));

    auto & signal_column = finished_batch.columns[column_indices.signal];
    ARROW_RETURN_NOT_OK(
        std::visit(pod5::visitors::finish_column{&signal_column}, signal_rows.signal_builder));

    auto & samples_column = finished_batch.columns[column_indices.samples];
    ARROW_RETURN_NOT_OK(signal_rows.samples_builder.Finish(&samples_column));

    return finished_batch;
}

// Write a group of completed reads to the output file.
//
// `signal_row_indices` holds the signal rows of all reads back to back;
// `signal_row_sizes[i]` says how many of them belong to `reads[i]`, and
// `signal_durations[i]` is passed through as that read's duration.
//
// Returns OK, or the first error reported by the writer.
arrow::Status write_reads(
    std::shared_ptr<pod5::FileWriter> const & output,
    std::vector<pod5::ReadData> const & reads,
    std::vector<std::size_t> const & signal_durations,
    std::vector<std::size_t> const & signal_row_sizes,
    std::vector<pod5::SignalTableRowIndex> const & signal_row_indices)
{
    POD5_TRACE_FUNCTION();
    auto all_signal_indices = gsl::make_span(signal_row_indices);

    std::size_t next_signal_offset = 0;
    std::size_t read_index = 0;
    for (auto const & read : reads) {
        // Carve this read's slice out of the flattened index list.
        auto const read_row_count = signal_row_sizes[read_index];
        auto read_signal_rows = all_signal_indices.subspan(next_signal_offset, read_row_count);
        next_signal_offset += read_row_count;

        ARROW_RETURN_NOT_OK(
            output->add_complete_read(read, read_signal_rows, signal_durations[read_index]));
        ++read_index;
    }

    return arrow::Status::OK();
}

// Record the read ids of `new_reads` in `output_read_ids`, failing on the first id
// that is already present.
//
// Ids inserted before a duplicate is found remain in the set.
// Returns OK if every id was new, otherwise an Invalid status naming the duplicate.
arrow::Status check_duplicate_read_ids(
    std::unordered_set<pod5::Uuid> & output_read_ids,
    std::vector<pod5::ReadData> const & new_reads)
{
    for (auto const & candidate : new_reads) {
        bool const newly_inserted = output_read_ids.insert(candidate.read_id).second;
        if (newly_inserted) {
            continue;
        }

        return arrow::Status::Invalid(
            "Duplicate read id ", to_string(candidate.read_id), " found in file");
    }

    return arrow::Status::OK();
}

}  // namespace repack


================================================
FILE: c++/pod5_format_pybind/repack/repack_output.cpp
================================================
#include "repack_output.h"

#include "pod5_format/internal/tracing/tracing.h"
#include "repack_functions.h"

#include <iostream>
#include <thread>
#include <unordered_set>

namespace repack {

namespace {
// Visitor returning true when the visited pointer-like value is not null.
struct is_not_nullptr {
    template <typename Pointer>
    bool operator()(Pointer const & candidate) const
    {
        bool const holds_value = (candidate != nullptr);
        return holds_value;
    }
};

// Disabled debugging aid (compiled out by `#if 0`): prints how many queued
// state items of each type are present.
#if 0
// Visitor returning the typeid name of the pointee type of the visited pointer.
struct get_name{
    template <typename T>
    std::string operator()(T const& t) const {
        return typeid(typename T::element_type).name();
    }
};

// Count the queued items by type name and print the totals to stdout.
template <typename T>
void dump_queued_items(T const& queued) {
    std::map<std::string, std::size_t> items;

    for (auto const& item : queued) {
        items[std::visit(get_name{}, item)] += 1;
    }

    std::cout << "Queued items:\n";
    for (auto pr : items) {
        std::cout << "  " << pr.first << ": " << pr.second << "\n";
    }
}
#endif

}  // namespace

// State owned by a single worker thread of a repacker output.
struct Pod5RepackerOutputThreadState {
    // Build the thread-local dictionary cache on top of the shared dictionary manager.
    Pod5RepackerOutputThreadState(
        std::shared_ptr<ReadsTableDictionaryManager> const & shared_dict_manager)
    : dict_cache(shared_dict_manager)
    {
    }

    // Cache used by this thread when resolving read table dictionary indices.
    ReadsTableDictionaryThreadCache dict_cache;
};

// Shared state for one repacker output: the destination writer plus the mutexes
// and bookkeeping used by the worker threads processing it.
struct Pod5RepackerOutputState {
    // The dictionary manager is built from the output file and
    // `read_table_writer_mutex`; that mutex is declared before `dict_manager`
    // below, so it is constructed first.
    Pod5RepackerOutputState(
        std::shared_ptr<pod5::FileWriter> const & _output_file,
        bool _check_duplicate_read_ids,
        arrow::MemoryPool * _memory_pool)
    : output_file(_output_file)
    , check_duplicate_read_ids(_check_duplicate_read_ids)
    , memory_pool(_memory_pool)
    , dict_manager(
          std::make_shared<ReadsTableDictionaryManager>(_output_file, read_table_writer_mutex))
    {
    }

    // Return the state belonging to the calling thread, creating it on first use.
    // The lookup and insertion are guarded by `thread_states_mutex`; the returned
    // pointer refers to the element stored in `thread_states`.
    Pod5RepackerOutputThreadState * get_thread_state()
    {
        std::lock_guard<std::mutex> l{thread_states_mutex};
        auto it = thread_states.find(std::this_thread::get_id());
        if (it == thread_states.end()) {
            it = thread_states.emplace(std::this_thread::get_id(), dict_manager).first;
        }
        return &it->second;
    }

    // Destination file.
    std::shared_ptr<pod5::FileWriter> output_file;
    // When true, read ids are checked against `output_read_ids` before being queued.
    bool check_duplicate_read_ids;
    // Pool passed to the signal builders.
    arrow::MemoryPool * memory_pool;
    // Held while writing reads to the output; also handed to the dictionary manager.
    std::mutex read_table_writer_mutex;
    // Held while adding a signal batch to the output.
    std::mutex signal_table_writer_mutex;
    std::shared_ptr<ReadsTableDictionaryManager> dict_manager;
    // Guards `partial_signal_batch`.
    std::mutex partial_signal_batch_mutex;
    // Signal batch that is not yet full; carried over between read table batches.
    std::shared_ptr<states::read_split_signal_table_batch_rows> partial_signal_batch;
    // Running count of reads written to the output.
    std::atomic<std::size_t> reads_completed{0};

    // Guards `thread_states`.
    std::mutex thread_states_mutex;
    // Per-thread state, keyed by thread id.
    std::unordered_map<std::thread::id, Pod5RepackerOutputThreadState> thread_states;

    // Guards `output_read_ids`.
    std::mutex output_read_ids_mutex;
    // Read ids seen so far; only populated when duplicate checking is enabled.
    std::unordered_set<pod5::Uuid> output_read_ids;
};

namespace {

// Result of processing one state: the follow-up states that should be queued next.
struct StateProgressResult {
    StateProgressResult() = default;

    // Takes ownership of `_new_states`. A named rvalue reference is an lvalue, so
    // std::move is required here to move the vector rather than copy it.
    StateProgressResult(std::vector<states::shared_variant> && _new_states)
    : new_states(std::move(_new_states))
    {
    }

    // States produced by the operation; empty when nothing further is required.
    std::vector<states::shared_variant> new_states;
};

// Visitor that advances one queued state by a single step. It is applied with
// std::visit to a states::shared_variant; each overload handles one state type and
// returns the follow-up states to queue, or an error.
struct StateOperator {
    // `_progress_state` is not owned; it must outlive this operator.
    StateOperator(Pod5RepackerOutputState * _progress_state) : progress_state(_progress_state) {}

    // Step 1: read a batch of read table rows from the source file and split their
    // signal rows into output signal batches.
    //
    // The input batch is consumed (moved from, then reset). Returns the signal
    // batches that became full; a partially filled batch is kept in
    // `progress_state->partial_signal_batch` for the next call.
    //
    // NOTE(review): the read table rows are only re-queued from the signal batch
    // overload below, via the patch rows. If a batch yields no signal rows at all,
    // nothing here appears to queue `read_table_rows` for writing - confirm whether
    // that case can occur.
    arrow::Result<StateProgressResult> operator()(
        std::shared_ptr<states::unread_read_table_rows> & batch) const
    {
        POD5_TRACE_FUNCTION();

        // Read out the read table data from the source file
        ARROW_ASSIGN_OR_RAISE(
            auto read_result,
            read_read_data(progress_state->get_thread_state()->dict_cache, std::move(*batch)));
        batch.reset();

        auto read_table_rows = std::make_shared<states::read_read_table_rows_no_signal>();
        read_table_rows->reads = std::move(read_result.reads);
        read_table_rows->signal_durations = std::move(read_result.signal_durations);
        read_table_rows->signal_row_sizes = std::move(read_result.signal_row_sizes);
        // One slot per signal row; filled in once the signal has been written.
        read_table_rows->signal_row_indices.resize(read_result.signal_rows.size());

        if (progress_state->check_duplicate_read_ids) {
            std::lock_guard<std::mutex> l{progress_state->output_read_ids_mutex};
            ARROW_RETURN_NOT_OK(
                check_duplicate_read_ids(progress_state->output_read_ids, read_table_rows->reads));
        }

        // Split the read table rows into new signal table batches:
        {
            // Held for the whole split so the partial batch is extended by one
            // thread at a time.
            std::lock_guard<std::mutex> l{progress_state->partial_signal_batch_mutex};
            ARROW_ASSIGN_OR_RAISE(
                auto signal_request_result,
                request_signal_reads(
                    read_result.input,
                    progress_state->output_file->signal_type(),
                    progress_state->output_file->signal_table_batch_size(),
                    read_result.signal_rows_read_ids,
                    read_result.signal_rows,
                    progress_state->partial_signal_batch,
                    read_table_rows,
                    progress_state->memory_pool));

            progress_state->partial_signal_batch = signal_request_result.partial_request;
            return StateProgressResult{std::move(signal_request_result.complete_requests)};
        }
    }

    // Step 2: write a signal batch to the output and patch the resulting signal row
    // indices into the read table rows that reference them.
    //
    // Returns every read table whose signal rows have now all been written.
    arrow::Result<StateProgressResult> operator()(
        std::shared_ptr<states::read_split_signal_table_batch_rows> & batch) const
    {
        POD5_TRACE_FUNCTION();

        ARROW_ASSIGN_OR_RAISE(auto read_signal_result, read_signal_data(*batch));

        std::pair<pod5::SignalTableRowIndex, pod5::SignalTableRowIndex> inserted_signal_rows;
        {
            // Only the write itself is serialised; patching happens outside the lock.
            std::lock_guard<std::mutex> l(progress_state->signal_table_writer_mutex);
            ARROW_ASSIGN_OR_RAISE(
                inserted_signal_rows,
                progress_state->output_file->add_signal_batch(
                    read_signal_result.row_count,
                    std::move(read_signal_result.columns),
                    read_signal_result.final_batch));
        }

        std::vector<states::shared_variant> result_new_states;

        // Patch row i corresponds to the i-th row of the batch just written, so its
        // output index is the first inserted index plus i.
        for (std::size_t i = 0; i < batch->patch_rows.size(); ++i) {
            auto const & row = batch->patch_rows[i];

            auto const & dest_read_table = row.dest_read_table;
            assert(dest_read_table);
            assert(row.dest_batch_row_index < dest_read_table->signal_row_indices.size());
            dest_read_table->signal_row_indices[row.dest_batch_row_index] =
                inserted_signal_rows.first + i;
            // NOTE(review): no lock is taken around this update or the comparison
            // below, and the type of `written_row_indices` is not visible here -
            // confirm this is safe if several signal batches patch the same read
            // table concurrently.
            dest_read_table->written_row_indices += 1;

            // Check if this read table is completed!
            if (dest_read_table->written_row_indices > dest_read_table->signal_row_indices.size()) {
                assert(false);
            }
            if (dest_read_table->written_row_indices == dest_read_table->signal_row_indices.size())
            {
                result_new_states.push_back(dest_read_table);
            }
        }

        return StateProgressResult{std::move(result_new_states)};
    }

    // Step 3: write read table rows whose signal indices are all known.
    //
    // Holds `read_table_writer_mutex` for the write and adds the number of reads to
    // `reads_completed`. Produces no follow-up states.
    arrow::Result<StateProgressResult> operator()(
        std::shared_ptr<states::read_read_table_rows_no_signal> & batch) const
    {
        POD5_TRACE_FUNCTION();
        assert(batch->written_row_indices == batch->signal_row_indices.size());

        std::lock_guard<std::mutex> l(progress_state->read_table_writer_mutex);
        ARROW_RETURN_NOT_OK(write_reads(
            progress_state->output_file,
            batch->reads,
            batch->signal_durations,
            batch->signal_row_sizes,
            batch->signal_row_indices));
        progress_state->reads_completed += batch->reads.size();

        return StateProgressResult{{}};
    }

    // Final step: flush the partially filled signal batch, if one exists, marking it
    // as the final batch. The parameter is unused.
    arrow::Result<StateProgressResult> operator()(std::shared_ptr<states::finished> & batch) const
    {
        POD5_TRACE_FUNCTION();

        std::vector<states::shared_variant> final_states;
        // No further reads expected, flush all partial state:
        std::lock_guard<std::mutex> l{progress_state->partial_signal_batch_mutex};
        if (progress_state->partial_signal_batch) {
            progress_state->partial_signal_batch->final_batch = true;

            final_states.emplace_back(std::move(progress_state->partial_signal_batch));
            progress_state->partial_signal_batch.reset();
        }

        return StateProgressResult{std::move(final_states)};
    }

    // Shared output state; not owned.
    Pod5RepackerOutputState * progress_state;
};

}  // namespace

// Create an output bound to a repacker, a worker thread pool and a destination file.
//
// \param repacker                 Repacker this output belongs to.
// \param thread_pool              Pool that work for this output is posted to.
// \param output                   Destination file writer.
// \param check_duplicate_read_ids When true, reads are checked for duplicate ids as
//                                 they are queued.
//
// The progress state is created with arrow's default memory pool.
Pod5RepackerOutput::Pod5RepackerOutput(
    std::shared_ptr<Pod5Repacker> const & repacker,
    std::shared_ptr<pod5::ThreadPool> thread_pool,
    std::shared_ptr<pod5::FileWriter> const & output,
    bool check_duplicate_read_ids)
: m_repacker(repacker)
// `thread_pool` is a by-value sink parameter: move it rather than copying again.
, m_thread_pool(std::move(thread_pool))
, m_output(output)
, m_progress_state(
      std::make_unique<Pod5RepackerOutputState>(
          output,
          check_duplicate_read_ids,
          arrow::default_memory_pool()))
{
}

// Defined in this translation unit, where Pod5RepackerOutputState is a complete type.
Pod5RepackerOutput::~Pod5RepackerOutput() = default;

bool Pod5RepackerOutput::has_tasks() const
{
    if (m_in_flight > 0) {
        return true;
    }
    std::lock_guard<std::mutex> l{m_active_read_table_states_mutex};
    return m_active_read_table_states.size() > 0;
}

// Mark the output as finished.
//
// Waits (polling once per millisecond) until all outstanding work has drained or
// an error has been flagged, then queues a `finished` state so the remaining
// partial data is flushed. Calling this again once finished does nothing.
void Pod5RepackerOutput::set_finished()
{
    if (m_finished) {
        return;
    }

    // Wait for all other tasks to flush through the output.
    while (!m_has_error && has_tasks()) {
        std::this_thread::sleep_for(std::chrono::milliseconds(1));
    }

    {
        std::lock_guard<std::mutex> l{m_active_read_table_states_mutex};
        m_active_read_table_states.emplace_front(std::make_shared<states::finished>());
    }
    post_try_work();

    m_finished = true;
}

// An output is complete once it has been marked finished and its state queue is empty.
bool Pod5RepackerOutput::is_complete() const
{
    if (m_finished) {
        std::lock_guard<std::mutex> l{m_active_read_table_states_mutex};
        return m_active_read_table_states.empty();
    }
    return false;
}

// Number of reads written to this output so far.
std::size_t Pod5RepackerOutput::reads_completed() const
{
    std::size_t const completed = m_progress_state->reads_completed.load();
    return completed;
}

// Queue the reads of one read-table batch of `input` for writing to this
// output, then post a worker to pick the new state up.
//
// `batch_rows` is moved into the queued state. Throws std::runtime_error if
// the output has already been marked finished.
void Pod5RepackerOutput::register_new_reads(
    std::shared_ptr<pod5::FileReader> const & input,
    std::size_t batch_index,
    std::vector<std::uint32_t> && batch_rows)
{
    if (m_finished) {
        throw std::runtime_error("Failed to add reads to finished output");
    }

    // Build the state before taking the lock so the critical section is just
    // the queue insertion.
    auto pending_rows = std::make_shared<states::unread_read_table_rows>(
        input, batch_index, std::move(batch_rows));

    {
        std::lock_guard<std::mutex> guard{m_active_read_table_states_mutex};
        m_active_read_table_states.emplace_front(std::move(pending_rows));
    }

    post_try_work();
}

// Post a worker task to the thread pool that drains this output's state
// queue.
//
// The task repeatedly takes the state at the back of the queue, runs the
// StateOperator on it, appends any follow-up states the operator produced to
// the back of the queue, and continues with the next state. It stops when the
// queue is empty, when an operation fails (the error is recorded with
// set_error()), or when another worker has already recorded an error.
//
// NOTE(review): the lambda captures by reference, which includes `this`; the
// output must therefore outlive every task posted here - confirm that the
// owner guarantees this.
void Pod5RepackerOutput::post_try_work()
{
    m_thread_pool->post([&]() {
        POD5_TRACE_FUNCTION();

        // Pop the state at the back of the queue, or return an empty variant
        // if there is none. The caller must hold the queue mutex.
        auto get_next_work = [](auto & locked_states) -> states::shared_variant {
            if (locked_states.empty()) {
                return {};
            }

            auto work = locked_states.back();
            locked_states.pop_back();
            return work;
        };

        StateOperator state_operator{m_progress_state.get()};

        states::shared_variant next_work;
        while (!m_has_error) {
            m_in_flight += 1;
            // It's important we don't release this until any new states
            // are in `m_active_read_table_states`
            // (otherwise has_tasks() could briefly see neither in-flight work
            // nor queued states while follow-up work is still pending).
            auto remove_in_flight = gsl::finally([&] { m_in_flight -= 1; });

            // Nothing carried over from the previous iteration: fetch from
            // the queue, and finish this task if the queue is empty.
            if (!std::visit(is_not_nullptr{}, next_work)) {
                std::lock_guard<std::mutex> l{m_active_read_table_states_mutex};
                next_work = get_next_work(m_active_read_table_states);
                if (!std::visit(is_not_nullptr{}, next_work)) {
                    return;
                }
            }

            auto result = std::visit(state_operator, next_work);
            if (!result.ok()) {
                set_error(result.status());
                return;
            }
            next_work = {};

            {
                // Publish follow-up states and grab the next one in a single
                // critical section.
                std::lock_guard<std::mutex> l{m_active_read_table_states_mutex};
                auto && states = m_active_read_table_states;
                states.insert(states.end(), result->new_states.begin(), result->new_states.end());

                next_work = get_next_work(states);
            }
        }
    });
}

}  // namespace repack


================================================
FILE: c++/pod5_format_pybind/repack/repack_output.h
================================================
#pragma once

#include "pod5_format/file_writer.h"
#include "pod5_format/thread_pool.h"
#include "repack_states.h"

#include <atomic>
#include <deque>
#include <memory>
#include <mutex>
#include <vector>

namespace repack {

class Pod5Repacker;

struct Pod5RepackerOutputState;

// One output file of a Pod5Repacker.
//
// Holds a queue of pending work states for the output and posts worker tasks
// to a shared thread pool to process them. The first failure is recorded and
// exposed through has_error() / error().
class Pod5RepackerOutput {
public:
    Pod5RepackerOutput(
        std::shared_ptr<Pod5Repacker> const & repacker,
        std::shared_ptr<pod5::ThreadPool> thread_pool,
        std::shared_ptr<pod5::FileWriter> const & output,
        bool check_duplicate_read_ids);
    ~Pod5RepackerOutput();

    // Path of the underlying output file, as reported by the writer.
    std::string path() const { return m_output->path(); }

    // The repacker that created this output.
    std::shared_ptr<Pod5Repacker> const & repacker() const { return m_repacker; }

    // True while a worker is processing or states are queued.
    bool has_tasks() const;

    // Copy of the recorded error status (taken under the error mutex).
    arrow::Status error()
    {
        std::lock_guard<std::mutex> l{m_error_mutex};
        return m_error;
    }

    // Lock-free check for whether an error has been recorded.
    bool has_error() const { return m_has_error.load(); }

    // Inform the output no further reads will be added
    void set_finished();

    // Check if the output has completed all writes
    bool is_complete() const;

    // Number of reads completed
    std::size_t reads_completed() const;

    // Register new writes to the output, should not be called after #set_finished
    void register_new_reads(
        std::shared_ptr<pod5::FileReader> const & input,
        std::size_t batch_index,
        std::vector<std::uint32_t> && batch_rows = {}  // All rows by default
    );

private:
    // Post a worker task that drains the state queue.
    void post_try_work();

    // Record `error` (which must not be OK) and raise the error flag.
    void set_error(arrow::Status error)
    {
        assert(!error.ok());
        {
            std::lock_guard<std::mutex> l{m_error_mutex};
            m_error = std::move(error);
        }
        // Set the flag only after the status is stored, so a reader that
        // sees has_error() can then fetch the status via error().
        m_has_error = true;
    }

    std::shared_ptr<Pod5Repacker> m_repacker;
    std::shared_ptr<pod5::ThreadPool> m_thread_pool;
    std::shared_ptr<pod5::FileWriter> m_output;
    // Set once set_finished() has queued the terminal state.
    std::atomic<bool> m_finished{false};

    // Error flag plus the status it refers to; the status is guarded by
    // m_error_mutex.
    std::atomic<bool> m_has_error{false};
    std::mutex m_error_mutex;
    arrow::Status m_error;

    // Number of workers currently inside the processing loop.
    std::atomic<std::size_t> m_in_flight{0};
    // Queue of pending states, guarded by the mutex declared alongside it.
    mutable std::mutex m_active_read_table_states_mutex;
    std::deque<states::shared_variant> m_active_read_table_states;

    std::unique_ptr<Pod5RepackerOutputState> m_progress_state;
};

}  // namespace repack


================================================
FILE: c++/pod5_format_pybind/repack/repack_states.h
================================================
#pragma once

#include "pod5_format/file_reader.h"
#include "pod5_format/signal_builder.h"

#include <arrow/array/builder_binary.h>
#include <arrow/array/builder_primitive.h>

#include <cstddef>
#include <cstdint>
#include <variant>
#include <vector>

namespace repack { namespace states {

// Work state: rows of one read-table batch of an input file that have been
// registered with an output but not processed yet.
class unread_read_table_rows {
public:
    // `_batch_rows` is moved into the state.
    unread_read_table_rows(
        std::shared_ptr<pod5::FileReader> const & _input,
        std::size_t _batch_index,
        std::vector<std::uint32_t> && _batch_rows)
    : input(_input)
    , batch_index(_batch_index)
    , batch_rows(std::move(_batch_rows))
    {
    }

    // Source file; held by shared_ptr so the reader stays alive with the state.
    std::shared_ptr<pod5::FileReader> input;
    // Index of the read-table record batch within `input`.
    std::size_t batch_index;
    // Selected row indices within the batch; callers pass an empty vector to
    // mean "all rows" (see the default on register_new_reads).
    std::vector<std::uint32_t> batch_rows;
};

// Work state: read-table rows that have been loaded, with bookkeeping for
// their signal rows.
// NOTE(review): the exact meaning of the per-read vectors below is inferred
// from their names only - confirm against the code that fills them.
class read_read_table_rows_no_signal {
public:
    std::vector<pod5::ReadData> reads;
    std::vector<std::size_t> signal_durations;
    std::vector<std::size_t> signal_row_sizes;

    // Atomic counter; presumably counts how many entries of
    // `signal_row_indices` have been filled in - TODO confirm.
    std::atomic<std::size_t> written_row_indices{0};
    std::vector<pod5::SignalTableRowIndex> signal_row_indices;
};

// Work state: a signal-table batch under construction, together with a
// record of which read-table state each of its rows belongs to.
class read_split_signal_table_batch_rows {
public:
    // Links one row of this signal batch to a destination read-table state
    // and an index within it.
    // NOTE(review): presumably used to write the final signal row index back
    // into the read table once it is known - confirm against the consumer.
    struct PatchRecord {
        PatchRecord(
            std::shared_ptr<states::read_read_table_rows_no_signal> dest_read_table,
            std::uint64_t dest_batch_row_index)
        : dest_read_table(dest_read_table)
        , dest_batch_row_index(dest_batch_row_index)
        {
        }

        std::shared_ptr<states::read_read_table_rows_no_signal> dest_read_table;
        std::uint64_t dest_batch_row_index;
    };

    // Takes ownership of `signal_builder`; the read-id and sample-count
    // builders are created on `pool`.
    read_split_signal_table_batch_rows(
        pod5::SignalBuilderVariant && signal_builder,
        arrow::MemoryPool * pool)
    : read_id_builder(pod5::make_read_id_builder(pool))
    , signal_builder(std::move(signal_builder))
    , samples_builder(pool)
    {
    }

    // Column builders for the batch.
    std::unique_ptr<arrow::FixedSizeBinaryBuilder> read_id_builder;
    pod5::SignalBuilderVariant signal_builder;
    arrow::UInt32Builder samples_builder;

    // One record per row added to the batch (see row_count()).
    std::vector<PatchRecord> patch_rows;
    // Set when this is the last, possibly partial, batch for the output.
    bool final_batch = false;

    // Number of rows currently in the batch.
    std::size_t row_count() const { return patch_rows.size(); }
};

// Terminal marker state: queued by Pod5RepackerOutput::set_finished() once no
// further reads will be registered. Carries no data.
struct finished {};

// A queued unit of work: a shared pointer to exactly one of the state types.
// A default-constructed variant holds a null pointer to the first
// alternative, which the worker loop treats as "no work".
using shared_variant = std::variant<
    std::shared_ptr<unread_read_table_rows>,
    std::shared_ptr<read_split_signal_table_batch_rows>,
    std::shared_ptr<read_read_table_rows_no_signal>,
    std::shared_ptr<finished>>;

}}  // namespace repack::states


================================================
FILE: c++/pod5_format_pybind/repack/repack_utils.h
================================================
#pragma once

#include "pod5_format/read_table_reader.h"

#include <arrow/array/array_dict.h>

#include <mutex>
#include <unordered_map>

namespace repack {

// Hash functor for std::pair keys in unordered containers.
//
// The two element hashes are mixed with an order-sensitive combine step
// (the well-known "hash_combine" recipe) rather than a plain XOR: XOR is
// symmetric, so (a, b) and (b, a) would collide, and any pair whose elements
// hash equally would collapse to 0.
struct pair_hasher {
    template <class T1, class T2>
    std::size_t operator()(std::pair<T1, T2> const & pair) const
    {
        std::size_t seed = std::hash<T1>{}(pair.first);
        std::size_t const second_hash = std::hash<T2>{}(pair.second);
        // Golden-ratio constant plus shifted copies of the seed spread the
        // bits of the second hash across the result.
        seed ^= second_hash + 0x9e3779b9 + (seed << 6) + (seed >> 2);
        return seed;
    }
};

// Hash functor for RunInfoData keys: hashes only the acquisition id, leaving
// full comparison to the key's equality operator.
struct run_info_hasher {
    std::size_t operator()(pod5::RunInfoData const & run_info) const
    {
        std::hash<std::string> const string_hasher{};
        return string_hasher(run_info.acquisition_id);
    }
};

// Maps pore-type and run-info dictionary entries of input files onto the
// dictionaries of a single output file, adding entries to the output the
// first time a value is seen. Every lookup is serialised on the writer mutex
// supplied at construction.
class ReadsTableDictionaryManager {
public:
    ReadsTableDictionaryManager(
        std::shared_ptr<pod5::FileWriter> const & output_file,
        std::mutex & writer_mutex)
    : m_output_file(output_file)
    , m_writer_mutex(writer_mutex)
    {
    }

    // Find or create the output-file pore index matching `source_index` of
    // `source_batch`. Entries are matched by pore type value.
    arrow::Result<pod5::PoreDictionaryIndex> find_pore_index(
        std::shared_ptr<pod5::FileReader> const & source_file,
        pod5::ReadTableRecordBatch const & source_batch,
        pod5::PoreDictionaryIndex source_index)
    {
        std::lock_guard<std::mutex> guard(m_writer_mutex);

        ARROW_ASSIGN_OR_RAISE(auto pore_type, source_batch.get_pore_type(source_index));

        // Already written to the output: reuse its index.
        auto const known_entry = m_pore_data_indexes.find(pore_type);
        if (known_entry != m_pore_data_indexes.end()) {
            return known_entry->second;
        }

        // First sighting of this pore type: add it and remember the index.
        pod5::PoreDictionaryIndex new_index = 0;
        ARROW_ASSIGN_OR_RAISE(new_index, m_output_file->add_pore_type(pore_type));
        m_pore_data_indexes[pore_type] = new_index;
        return new_index;
    }

    // Find or create the output-file run-info index matching `source_index`
    // of `source_batch`. Entries are matched by run-info value.
    arrow::Result<pod5::RunInfoDictionaryIndex> find_run_info_index(
        std::shared_ptr<pod5::FileReader> const & source_file,
        pod5::ReadTableRecordBatch const & source_batch,
        pod5::RunInfoDictionaryIndex source_index)
    {
        std::lock_guard<std::mutex> guard(m_writer_mutex);

        ARROW_ASSIGN_OR_RAISE(auto acquisition, source_batch.get_run_info(source_index));
        ARROW_ASSIGN_OR_RAISE(auto const run_info, source_file->find_run_info(acquisition));

        // Already written to the output: reuse its index.
        auto const known_entry = m_run_info_data_indexes.find(*run_info);
        if (known_entry != m_run_info_data_indexes.end()) {
            return known_entry->second;
        }

        // First sighting of this run info: add it and remember the index.
        pod5::RunInfoDictionaryIndex new_index = 0;
        ARROW_ASSIGN_OR_RAISE(new_index, m_output_file->add_run_info(*run_info));
        m_run_info_data_indexes[*run_info] = new_index;
        return new_index;
    }

private:
    std::shared_ptr<pod5::FileWriter> m_output_file;

    std::mutex & m_writer_mutex;

    // Value -> output dictionary index, for entries already added.
    std::unordered_map<std::string, pod5::PoreDictionaryIndex> m_pore_data_indexes;
    std::unordered_map<pod5::RunInfoData, pod5::RunInfoDictionaryIndex, run_info_hasher>
        m_run_info_data_indexes;
};

// Lock-free front cache for a ReadsTableDictionaryManager.
//
// Remembers, per (input file, source dictionary index), the output index that
// the shared manager returned, so repeated lookups avoid the manager's mutex.
// The cache itself has no synchronisation.
// NOTE(review): the name suggests one instance per worker thread - confirm
// with the call sites.
class ReadsTableDictionaryThreadCache {
public:
    ReadsTableDictionaryThreadCache(std::shared_ptr<ReadsTableDictionaryManager> const & main_cache)
    : m_main_cache(main_cache)
    {
    }

    // Find or create a pore index in the output file - expects to run on strand.
    // Answers from the local cache when possible, otherwise asks the shared
    // manager and caches the result.
    arrow::Result<pod5::PoreDictionaryIndex> find_pore_index(
        std::shared_ptr<pod5::FileReader> const & source_file,
        pod5::ReadTableRecordBatch const & source_batch,
        pod5::PoreDictionaryIndex source_index)
    {
        auto const key = std::make_pair(make_file_key(source_file), source_index);
        auto const it = m_pore_indexes.find(key);
        if (it != m_pore_indexes.end()) {
            return it->second;
        }

        ARROW_ASSIGN_OR_RAISE(
            auto dest_index,
            m_main_cache->find_pore_index(source_file, source_batch, source_index));
        m_pore_indexes[key] = dest_index;
        return dest_index;
    }

    // Find or create a run_info index in the output file - expects to run on strand.
    // Answers from the local cache when possible, otherwise asks the shared
    // manager and caches the result.
    arrow::Result<pod5::RunInfoDictionaryIndex> find_run_info_index(
        std::shared_ptr<pod5::FileReader> const & source_file,
        pod5::ReadTableRecordBatch const & source_batch,
        pod5::RunInfoDictionaryIndex source_index)
    {
        auto const key = std::make_pair(make_file_key(source_file), source_index);
        auto const it = m_run_info_indexes.find(key);
        if (it != m_run_info_indexes.end()) {
            return it->second;
        }

        ARROW_ASSIGN_OR_RAISE(
            auto dest_index,
            m_main_cache->find_run_info_index(source_file, source_batch, source_index));
        m_run_info_indexes[key] = dest_index;
        return dest_index;
    }

private:
    using FileKey = std::uint64_t;

    // Identify an input file by the address of its reader object.
    // NOTE(review): the key is a raw address and the cache does not keep the
    // reader alive, so if a reader is destroyed and a new one is allocated at
    // the same address, stale entries would be reused for the new file -
    // confirm whether cache lifetime rules this out.
    FileKey make_file_key(std::shared_ptr<pod5::FileReader> const & file)
    {
        return reinterpret_cast<FileKey>(file.get());
    }

    // (file, source index) -> output index.
    template <typename IndexType>
    using DictionaryLookup =
        std::unordered_map<std::pair<FileKey, IndexType>, IndexType, pair_hasher>;

    std::shared_ptr<ReadsTableDictionaryManager> m_main_cache;

    DictionaryLookup<pod5::PoreDictionaryIndex> m_pore_indexes;
    DictionaryLookup<pod5::RunInfoDictionaryIndex> m_run_info_indexes;
};

}  // namespace repack


================================================
FILE: c++/pod5_format_pybind/repack/repacker.cpp
================================================
#include "repacker.h"

#include "pod5_format/internal/tracing/tracing.h"
#include "repack_output.h"
#include "repack_states.h"

namespace repack {

namespace {

// Validate the arguments shared by the "add reads" entry points.
//
// Throws std::runtime_error if `output` was created by a different repacker,
// or if `input` carries no reader.
void repacker_add_reads_preconditions(
    std::shared_ptr<Pod5Repacker> const & repacker,
    std::shared_ptr<Pod5RepackerOutput> const & output,
    Pod5FileReaderPtr const & input)
{
    bool const created_by_this_repacker = (output->repacker() == repacker);
    if (!created_by_this_repacker) {
        throw std::runtime_error("Invalid repacker output passed, created by another repacker");
    }

    bool const has_reader = static_cast<bool>(input.reader);
    if (!has_reader) {
        throw std::runtime_error("Invalid input passed to repacker, no reader");
    }
}

}  // namespace

// Create the repacker together with the thread pool shared by all of its
// outputs.
// NOTE(review): the argument 10 is presumably the worker thread count -
// confirm against pod5::make_thread_pool.
Pod5Repacker::Pod5Repacker() : m_thread_pool{pod5::make_thread_pool(10)} {}

// Finish any outstanding work when the repacker is destroyed.
//
// finish() reports output errors by throwing (via check_for_error()), and it
// does so before the thread pool has been drained. Destructors are implicitly
// noexcept, so an exception escaping from here would call std::terminate.
// The error is therefore swallowed; callers that need to observe it must
// call finish() explicitly before destruction.
Pod5Repacker::~Pod5Repacker()
{
    try {
        finish();
    } catch (...) {
        // finish() may have thrown before reaching stop_and_drain(); make
        // sure no worker is still running against the outputs we are about
        // to release. A second call after an explicit finish() already
        // happens on the normal path, so repeating it here is safe.
        try {
            m_thread_pool->stop_and_drain();
        } catch (...) {
            // Nothing further can be done during destruction.
        }
    }
}

// Finish all outputs, drain the thread pool and release the outputs.
//
// Throws std::runtime_error (from check_for_error()) if any output recorded
// an error; in that case the pool is not drained and the outputs are kept.
void Pod5Repacker::finish()
{
    POD5_TRACE_FUNCTION();
    // Blocks per output until its queued work has flushed (or it has failed).
    for (auto & output : m_outputs) {
        output->set_finished();
    }

    check_for_error();

    m_thread_pool->stop_and_drain();

    // Keep the completed-read total available after the outputs are dropped,
    // so reads_completed() stays correct.
    for (auto & output : m_outputs) {
        m_reads_complete_deleted_outputs += output->reads_completed();
    }
    m_outputs.clear();
}

// Create a new output writing to `output`, register it with this repacker and
// return it. `check_duplicate_read_ids` is forwarded to the output.
std::shared_ptr<Pod5RepackerOutput> Pod5Repacker::add_output(
    std::shared_ptr<pod5::FileWriter> const & output,
    bool check_duplicate_read_ids)
{
    POD5_TRACE_FUNCTION();
    auto const self = shared_from_this();
    m_outputs.push_back(
        std::make_shared<Pod5RepackerOutput>(
            self, m_thread_pool, output, check_duplicate_read_ids));
    return m_outputs.back();
}

// Mark a single output as finished.
//
// Throws std::runtime_error if `output` was created by a different repacker.
void Pod5Repacker::set_output_finished(std::shared_ptr<Pod5RepackerOutput> const & output)
{
    bool const created_by_this_repacker = (output->repacker() == shared_from_this());
    if (!created_by_this_repacker) {
        throw std::runtime_error("Invalid repacker output passed, created by another repacker");
    }

    output->set_finished();
}

// Queue every read of `input` for writing to `output`, one registration per
// read-table record batch, then track the reader as submitted.
void Pod5Repacker::add_all_reads_to_output(
    std::shared_ptr<Pod5RepackerOutput> const & output,
    Pod5FileReaderPtr const & input)
{
    POD5_TRACE_FUNCTION();
    repacker_add_reads_preconditions(shared_from_this(), output, input);

    auto const & reader = input.reader;
    std::size_t batch_index = 0;
    while (batch_index < reader->num_read_record_batches()) {
        // No row list is passed: the default selects all rows of the batch.
        output->register_new_reads(reader, batch_index);
        ++batch_index;
    }

    register_submitted_reader(reader);
}

void Pod5Repacker::py_add_selected_reads_to_output(
    std::shared_ptr<Pod5RepackerOutput> const & output,
    Pod5FileReaderPtr const & input,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batch_counts,
    py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && all_batch_rows)
{
    repacker_add_reads_preconditions(shared_from_this(), output, input);

    auto batch_counts_span = gsl::make_span(batch_counts.data(), batch_counts.size());
    auto all_batch_rows_span = gsl::make_span(all_batch_rows.data(), all_batch_rows.size());

    add_selected_reads_to_output(output, input.reader, batch_counts_span, all_batch_rows_span);
}

// Queue a selection of reads from `input` for writing to `output`.
//
// `batch_counts_span[i]` is the number of selected rows in read-table batch
// `i`; `all_batch_rows_span` holds the selected row indices of all batches
// back to back, in batch order. Batches with no selected rows are skipped.
//
// Throws std::runtime_error if the spans are inconsistent with the input
// (fewer counts than batches, or counts that add up to more rows than were
// supplied). Validation happens before anything is registered, so a bad
// selection never leaves the output partially populated.
void Pod5Repacker::add_selected_reads_to_output(
    std::shared_ptr<Pod5RepackerOutput> const & output,
    std::shared_ptr<pod5::FileReader> const & input,
    gsl::span<std::uint32_t const> batch_counts_span,
    gsl::span<std::uint32_t const> all_batch_rows_span)
{
    POD5_TRACE_FUNCTION();

    std::size_t const batch_count = input->num_read_record_batches();

    // These spans come from caller-supplied arrays; indexing them out of
    // range would trip a gsl contract violation and abort the process, so
    // report malformed input as an exception instead.
    if (static_cast<std::size_t>(batch_counts_span.size()) < batch_count) {
        throw std::runtime_error(
            "Invalid selection passed to repacker, fewer batch counts than read batches");
    }

    std::size_t total_selected_rows = 0;
    for (std::size_t i = 0; i < batch_count; ++i) {
        total_selected_rows += batch_counts_span[i];
    }
    if (total_selected_rows > static_cast<std::size_t>(all_batch_rows_span.size())) {
        throw std::runtime_error(
            "Invalid selection passed to repacker, batch counts exceed supplied rows");
    }

    std::size_t current_start_point = 0;
    for (std::size_t i = 0; i < batch_count; ++i) {
        std::size_t const rows_in_batch = batch_counts_span[i];

        // If this batch has no selected rows there is nothing to register.
        if (rows_in_batch == 0) {
            continue;
        }

        auto const batch_rows_span = all_batch_rows_span.subspan(current_start_point, rows_in_batch);
        std::vector<std::uint32_t> batch_rows(batch_rows_span.begin(), batch_rows_span.end());
        current_start_point += rows_in_batch;

        output->register_new_reads(input, i, std::move(batch_rows));
    }

    register_submitted_reader(input);
}

// Throw std::runtime_error carrying the status text of the first output (in
// registration order) that has recorded an error; return normally otherwise.
void Pod5Repacker::check_for_error() const
{
    for (auto const & output : m_outputs) {
        if (output->has_error()) {
            throw std::runtime_error(output->error().ToString());
        }
    }
}

// True once every registered output reports completion (trivially true when
// there are no outputs). Throws std::runtime_error if any output has failed.
bool Pod5Repacker::is_complete() const
{
    POD5_TRACE_FUNCTION();
    check_for_error();

    bool all_outputs_complete = true;
    for (auto const & output : m_outputs) {
        if (!output->is_complete()) {
            // One unfinished output is enough; stop asking the others.
            all_outputs_complete = false;
            break;
        }
    }

    return all_outputs_complete;
}

// Total reads completed across the live outputs plus those outputs already
// released by finish(). Throws std::runtime_error if any output has failed.
std::size_t Pod5Repacker::reads_completed() const
{
    POD5_TRACE_FUNCTION();
    check_for_error();

    // Start from the reads accounted for by outputs that no longer exist.
    std::size_t total_reads = m_reads_complete_deleted_outputs;
    for (auto const & output : m_outputs) {
        total_reads += output->reads_completed();
    }

    return total_reads;
}

}  // namespace repack


================================================
FILE: c++/pod5_format_pybind/repack/repacker.h
================================================
#pragma once

#include "pod5_format_pybind/api.h"

#include <pybind11/pybind11.h>

#include <memory>
#include <set>
#include <vector>

namespace repack {

class Pod5RepackerOutput;

// Copies reads from input POD5 files into one or more output files, using a
// shared thread pool.
//
// Must be owned by a std::shared_ptr: several members call
// shared_from_this().
class Pod5Repacker : public std::enable_shared_from_this<Pod5Repacker> {
public:
    Pod5Repacker();
    ~Pod5Repacker();

    // Finish all outputs, drain the thread pool and release the outputs.
    void finish();

    // Create and register an output that writes to `output`.
    std::shared_ptr<Pod5RepackerOutput> add_output(
        std::shared_ptr<pod5::FileWriter> const & output,
        bool check_duplicate_read_ids);
    // Mark one output as finished; it must belong to this repacker.
    void set_output_finished(std::shared_ptr<Pod5RepackerOutput> const & output);

    // Queue every read of `input` for `output`.
    void add_all_reads_to_output(
        std::shared_ptr<Pod5RepackerOutput> const & output,
        Pod5FileReaderPtr const & input);

    // Python-facing variant of add_selected_reads_to_output taking numpy
    // arrays.
    void py_add_selected_reads_to_output(
        std::shared_ptr<Pod5RepackerOutput> const & output,
        Pod5FileReaderPtr const & input,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && batch_counts,
        py::array_t<std::uint32_t, py::array::c_style | py::array::forcecast> && all_batch_rows);

    // Queue selected reads of `input` for `output`. `batch_counts` holds the
    // number of selected rows per read-table batch and `all_batch_rows` the
    // selected row indices of all batches, concatenated in batch order.
    void add_selected_reads_to_output(
        std::shared_ptr<Pod5RepackerOutput> const & output,
        std::shared_ptr<pod5::FileReader> const & input,
        gsl::span<std::uint32_t const> batch_counts,
        gsl::span<std::uint32_t const> all_batch_rows);

    // True once every output is complete; throws if an output has failed.
    bool is_complete() const;
    // Reads completed across all outputs; throws if an output has failed.
    std::size_t reads_completed() const;

    // Number of submitted readers that are still alive somewhere (expired
    // entries are pruned first). Throws if an output has failed.
    std::size_t currently_open_file_reader_count()
    {
        check_for_error();
        cleanup_submitted_readers();
        return m_file_readers.size();
    }

private:
    // Throw std::runtime_error if any output has recorded an error.
    void check_for_error() const;

    // Drop tracking entries whose reader has already been destroyed.
    void cleanup_submitted_readers()
    {
        std::erase_if(m_file_readers, [](auto const & ptr) { return ptr.expired(); });
    }

    // Track `input` weakly so its lifetime can be observed without extending
    // it.
    void register_submitted_reader(std::shared_ptr<pod5::FileReader> const & input)
    {
        cleanup_submitted_readers();
        m_file_readers.insert(input);
    }

    std::shared_ptr<pod5::ThreadPool> m_thread_pool;
    // Weak references ordered by owner, so the same reader is stored once.
    std::set<std::weak_ptr<pod5::FileReader>, std::owner_less<>> m_file_readers;
    std::vector<std::shared_ptr<Pod5RepackerOutput>> m_outputs;

    // Completed-read total carried over from outputs released by finish().
    std::size_t m_reads_complete_deleted_outputs{0};
};

}  // namespace repack


================================================
FILE: c++/pod5_format_pybind/subset.cpp
================================================
#include "subset.h"

#include <algorithm>
#include <chrono>
#include <cmath>
#include <cstddef>
#include <cstdlib>
#include <limits>
#include <ostream>
#include <string>

#ifndef _WIN32
#include <sys/resource.h>
#include <unistd.h>
#else
#include <io.h>

#include <cstdio>  // _getmaxstdio
#endif

#include "pod5_format/file_reader.h"
#include "pod5_format/file_writer.h"
#include "pod5_format/schema_metadata.h"
#include "repack/repacker.h"

#include <iostream>

namespace io_limits {

// Split the process's file-handle budget between input and output files.
// Outputs are favoured over inputs: fewer output batches means fewer passes
// over the complete set of inputs.
constexpr std::float_t kOutputsBias = 0.7f;
constexpr std::size_t kMinHandles = 1;
constexpr std::size_t kBaseReserve = 16;

// Number of input files that may be open at once, given the handle soft limit
// and the number of output files in use. Always within [kMinHandles, 256].
std::size_t clamp_open_inputs(std::size_t soft_limit, std::size_t output_files)
{
    constexpr std::size_t kMaxInHandles = 256;

    // Handles set aside for everything that is not an input file.
    std::size_t const reserved_handles = kBaseReserve + output_files;

    bool const has_headroom = soft_limit > reserved_handles + kMinHandles;
    if (!has_headroom) {
        return kMinHandles;
    }

    std::size_t const available = soft_limit - reserved_handles;
    return std::clamp(available, kMinHandles, kMaxInHandles);
}

// Number of output files that may be open at once, given the handle soft
// limit. Always within [kMinHandles, 4096].
std::size_t clamp_open_outputs(std::size_t soft_limit)
{
    constexpr std::size_t kMaxOutHandles = 4096;

    // Keep the base reserve plus room for at least one input.
    std::size_t const reserved_handles = kBaseReserve + kMinHandles;

    bool const has_headroom = soft_limit > reserved_handles + kMinHandles;
    if (!has_headroom) {
        return kMinHandles;
    }

    // Share of the limit granted to outputs; larger values are rounded down
    // to a multiple of 16.
    auto biased_limit = static_cast<std::size_t>(soft_limit * kOutputsBias);
    if (biased_limit > 32) {
        biased_limit -= biased_limit % 16;
    }

    std::size_t const unreserved = soft_limit - reserved_handles;
    std::size_t const candidate = unreserved < biased_limit ? unreserved : biased_limit;
    return std::clamp(candidate, kMinHandles, kMaxOutHandles);
}

// Best-effort detection of how many files the process may hold open.
// Falls back to 1024 when the platform query gives no usable answer.
std::size_t detect_soft_limit()
{
    constexpr std::size_t kSoftLimitFallback = 1024;

#ifndef _WIN32
    // Prefer the RLIMIT_NOFILE soft limit when it is set to a finite value.
    struct rlimit limits{};
    bool const have_rlimit = getrlimit(RLIMIT_NOFILE, &limits) == 0;
    if (have_rlimit && limits.rlim_cur != RLIM_INFINITY) {
        return static_cast<std::size_t>(limits.rlim_cur);
    }

    long const open_max = sysconf(_SC_OPEN_MAX);
    if (open_max > 0) {
        return static_cast<std::size_t>(open_max);
    }
    return kSoftLimitFallback;
#else
    // Only stdio stream limit, not a true OS handle limit.
    int const stdio_max = _getmaxstdio();
    if (stdio_max > 0) {
        return static_cast<std::size_t>(stdio_max);
    }
    return kSoftLimitFallback;
#endif
}
}  // namespace io_limits

/// \brief Simple progress bar for console applications
///
/// Each redraw rewrites the current console line as
/// `[=====     ] (current/max) task`, padded so that a shorter line fully
/// overwrites a longer one printed earlier. A newline is emitted when the bar
/// is destroyed.
class ProgressBar {
public:
    /// Number of character cells between the brackets.
    static constexpr int PB_WIDTH = 60;

    ProgressBar() {}

    ~ProgressBar() { std::fputs("\n", stdout); }

    /// Set the label shown after the counters and redraw.
    void set_task(std::string const & task_name)
    {
        m_task = task_name;
        print_progress();
    }

    /// Set the step count that represents 100%. Does not redraw.
    void update_max_steps(std::size_t max_steps) { this->m_max_steps = max_steps; }

    /// Set the current step and redraw, unless the step is unchanged.
    void update(std::size_t current_step)
    {
        if (current_step == m_current_step) {
            return;
        }
        m_current_step = current_step;
        print_progress();
    }

    /// Redraw the bar on the current console line.
    void print_progress()
    {
        // The bar may be drawn before a maximum is known (max steps == 0);
        // dividing then would produce NaN/inf, and converting that to int is
        // undefined. Treat it as 0% and never exceed 100%.
        float complete_ratio = 0.0f;
        if (m_max_steps > 0) {
            complete_ratio = std::min(
                1.0f, static_cast<float>(m_current_step) / static_cast<float>(m_max_steps));
        }
        int complete_length = static_cast<int>(complete_ratio * PB_WIDTH);
        std::string complete_string{"\r["};
        for (int i = 0; i < PB_WIDTH; ++i) {
            if (i < complete_length) {
                complete_string += "=";
            } else {
                complete_string += " ";
            }
        }
        complete_string += "] (" + std::to_string(m_current_step) + "/"
                           + std::to_string(m_max_steps) + ") " + m_task;
        m_max_printed_width = std::max<std::size_t>(m_max_printed_width, complete_string.size());
        // Pad to max width to overwrite previous longer lines
        complete_string.resize(m_max_printed_width, ' ');
        std::cout << complete_string.c_str() << std::flush;
    }

private:
    std::string m_task;
    std::size_t m_max_steps{0};
    std::size_t m_current_step{0};
    // Widest line printed so far; later lines are padded to this width.
    std::size_t m_max_printed_width{0};
};

void subset_pod5s_with_mapping(
    std::vector<std::filesystem::path> inputs,
    std::filesystem::path output,
    std::map<std::string, std::vector<std::string>> read_id_to_dest,
    bool missing_ok,
    bool duplicate_ok,
    bool force_overwrite)
{
    auto next_interrupt_check = std::chrono::steady_clock::now();
    auto poll_python_interrupt = [&]() {
        auto const now = std::chrono::steady_clock::now();
        if (now < next_interrupt_check) {
            return;
        }
        next_interrupt_check = now + std::chrono::milliseconds(500);

        pybind11::gil_scoped_acquire gil;
        if (PyErr_CheckSignals() != 0) {
            throw pybind11::error_already_set();
        }
    };

    struct OutputInfo {
        OutputInfo(std::shared_ptr<repack::Pod5RepackerOutput> && repacker_output_)
        : repacker_output(std::move(repacker_output_))
        {
        }

        std::shared_ptr<repack::Pod5RepackerOutput> repacker_output;

        void clear_per_input_working_data()
        {
            batch_counts.clear();
            all_batch_rows.clear();
            batch_counts.reserve(32);
            all_batch_rows.reserve(128);
        }

        void add_row(std::uint32_t row_index)
        {
            all_batch_rows.push_back(row_index);
            next_batch_size += 1;
        }

        void finish_batch()
        {
            batch_counts.push_back(next_batch_size);
            next_batch_size = 0;
        }

        // Per file working vectors:
        std::uint32_t next_batch_size = 0;
        std::vector<std::uint32_t> batch_counts;
        std::vector<std::uint32_t> all_batch_rows;
    };

    pod5::FileWriterOptions output_options{};
    output_options.set_keep_signal_file_open(false);
    output_options.set_keep_read_table_file_open(false);
    output_options.set_keep_run_info_file_open(false);
    pod5::FileReaderOptions input_options{};
    input_options.set_force_disable_file_mapping(true);

    // Process inputs in deterministic lexical path order.
    std::sort(inputs.begin(), inputs.end());

    std::vector<std::filesystem::path> created_output_files;
    auto cleanup = gsl::finally([&]() {
        for (auto const & path : created_output_files) {
            std::error_code ec;
            std::filesystem::remove(path, ec);
        }
    });

    bool issued_migration_warning = false;
    std::size_t const io_soft_limit = io_limits::detect_soft_limit();
    std::size_t const max_out_size = io_limits::clamp_open_outputs(io_soft_limit);

    // Create indexable view of the map iterators so we can conveniently index in batches.
    std::vector<std::map<std::string, std::vector<std::string>>::const_iterator> read_id_dest_iters;
    read_id_dest_iters.reserve(read_id_to_dest.size());
    std::size_t total_requested_read_ids = 0;
    for (auto it = read_id_to_dest.begin(); it != read_id_to_dest.end(); ++it) {
        poll_python_interrupt();

        // Check we're not unintentionally overwriting files
        auto const output_path = output / it->first;
        if (std::filesystem::exists(output_path)) {
            if (!force_overwrite) {
                throw std::runtime_error(
                    "Output files already exists and --force-overwrite not set. ");
            } else {
                std::filesystem::remove(output_path);
            }
        }

        // Index the map iterator and tally total reads
        read_id_dest_iters.push_back(it);
        total_requested_read_ids += it->second.size();
    }

    std::size_t found_read_count = 0;
    std::size_t total_reads_completed = 0;

    std::size_t const total_output_batches =
        (read_id_dest_iters.size() + max_out_size - 1) / max_out_size;

    if (total_output_batches > 1) {
        std::cerr << "Subsetting inputs into " << std::to_string(read_id_dest_iters.size())
                  << " files in " << std::to_string(total_output_batches) << " batches of at most "
                  << max_out_size << " outputs. IO limit: " << std::to_string(io_soft_limit)
                  << std::endl;
    }

    ProgressBar progress_bar;
    progress_bar.set_task("Starting...");
    progress_bar.update_max_steps(total_requested_read_ids);

    // Iterate over outputs in batches
    for (std::size_t out_st = 0; out_st < read_id_dest_iters.size(); out_st += max_out_size) {
        poll_python_interrupt();
        std::size_t const output_batch_index = (out_st / max_out_size) + 1;
        std::size_t const out_end = std::min(out_st + max_out_size, read_id_dest_iters.size());
        std::string const batch_prefix = "Batch [" + std::to_string(output_batch_index) + "/"
                                         + std::to_string(total_output_batches) + "]: ";

        auto repacker = std::make_shared<repack::Pod5Repacker>();
        std::unordered_multimap<pod5::Uuid, std::uint32_t> read_id_lookup;
        std::vector<OutputInfo> dest_to_output;
        dest_to_output.reserve(out_end - out_st);

        // For each output in this batch
        for (std::size_t out_idx = out_st; out_idx < out_end; ++out_idx) {
            poll_python_interrupt();
            auto const & read_id_dest = *read_id_dest_iters[out_idx];
            auto const output_path = output / read_id_dest.first;

            // Create the output file
            auto writer =
                pod5::create_file_writer(output_path.string(), "pod5_subset", output_options);
            if (!writer.ok()) {
                std::cerr << "Failed to create output file: " << output_path << std::endl;
                throw std::runtime_error("Failed to create output POD5 file");
            }

            // Add the output file writer to the repacker
            created_output_files.push_back(output_path);
            auto repacker_output_file = repacker->add_output(std::move(*writer), !duplicate_ok);
            std::size_t const repacker_output_idx = dest_to_output.size();
            dest_to_output.emplace_back(std::move(repacker_output_file));

            // Associate the requested read_ids to this output
            for (auto const & read_id : read_id_dest.second) {
                auto read_id_uuid = pod5::Uuid::from_string(read_id);
                if (!read_id_uuid) {
                    std::cerr << "Invalid read id uuid: " << read_id << std::endl;
                    throw std::runtime_error("Invalid read id uuid in mapping");
                }
                read_id_lookup.insert(std::make_pair(*read_id_uuid, repacker_output_idx));
            }
        }

        // Scale the max open input files by current output handle usage and system limits.
        std::size_t const max_open_input_files =
            io_limits::clamp_open_inputs(io_soft_limit, dest_to_output.size());
        std::size_t const max_in_size = std::max<std::size_t>(1, max_open_input_files);

        // Wait for the number of open readers in the repacker to go below `limit`
        auto wait_for_open_readers_below = [&](std::size_t limit) {
            auto last_update = std::chrono::steady_clock::now();
            while (repacker->currently_open_file_reader_count() >= limit) {
                std::this_thread::sleep_for(std::chrono::milliseconds(100));
                poll_python_interrupt();

                auto const now = std::chrono::steady_clock::now();
                if (now - last_update >= std::chrono::milliseconds(2000)) {
                    progress_bar.update(total_reads_completed + repacker->reads_completed());
                    progress_bar.set_task(
                        batch_prefix + "Waiting for queued writes to complete from "
                        + std::to_string(repacker->currently_open_file_reader_count())
                        + "files...");
                    last_update = now;
                }
            }
        };

        // Wait for the repacker to finish with it's currently open readers
        auto wait_for_open_readers_zero = [&]() {
            auto last_update = std::chrono::steady_clock::now();
            while (repacker->currently_open_file_reader_count() > 0) {
                std::this_thread::sleep_for(std::chrono::milliseconds(100));
                poll_python_interrupt();

                auto const now = std::chrono::steady_clock::now();
                if (now - last_update >= std::chrono::milliseconds(2000)) {
                    progress_bar.update(total_reads_completed + repacker->reads_completed());
                    progress_bar.set_task(batch_prefix + "Waiting for batch IO to complete...");
                    last_update = now;
                }
            }
        };

        // Walk each input file in chunks for this output batch.
        for (std::size_t in_st = 0; in_st < inputs.size(); in_st += max_in_size) {
            poll_python_interrupt();
            std::size_t const in_end = std::min(in_st + max_in_size, inputs.size());

            // Add an input in this chunk
            for (std::size_t in_idx = in_st; in_idx < in_end; ++in_idx) {
                poll_python_interrupt();
                auto const & input_path = inputs[in_idx];

                // Keep in-flight readers below chunk limit.
                wait_for_open_readers_below(max_in_size);

                // Clear previous row selections from a previous input file.
                for (auto & output_file : dest_to_output) {
                    output_file.clear_per_input_working_data();
                }

                // "Batch [i/N]: Subsetting {input}"
                progress_bar.set_task(
                    batch_prefix + "Subsetting " + input_path.filename().string());

                // Open the input file
                auto input_reader_opt = pod5::open_file_reader(input_path.string(), input_options);
                if (!input_reader_opt.ok()) {
                    std::cerr << "Failed to open input file: " << input_path << std::endl;
                    throw std::runtime_error("Failed to open input POD5 file");
                }
                auto const & input_reader = *input_reader_opt;
                if (!issued_migration_warning && out_st == 0) {
                    auto const pre_migration_version = input_reader->file_version_pre_migration();
                    auto const post_migration_version =
                        input_reader->schema_metadata().writing_pod5_version;
                    if (pre_migration_version != post_migration_version) {
                        std::cerr << "Warning: Migrated an input from POD5 version "
                                  << pre_migration_version.to_string() << " to "
                                  << post_migration_version.to_string()
                                  << " while subsetting. This can affect performance "
                                     "significantly. Consider updating input files."
                                  << std::endl;
                    }
                    issued_migration_warning = true;
                }

                // Walk the input file batches:
                for (std::size_t i = 0; i < input_reader->num_read_record_batches(); ++i) {
                    poll_python_interrupt();
                    auto batch = input_reader->read_read_record_batch(i);
                    if (!batch.ok()) {
                        std::cerr << "Failed to read batch " << i
                                  << " from input file: " << input_path << std::endl;
                        throw std::runtime_error("Failed to read read record batch from POD5 file");
                    }

                    // Test each read id in the batch to see if we want it:
                    auto const & read_id_column = batch->read_id_column();
                    for (std::int64_t row = 0; row < read_id_column->length(); ++row) {
                        if ((row & 0x3FF) == 0) {
                            poll_python_interrupt();
                        }
                        auto const found = read_id_lookup.equal_range(read_id_column->Value(row));
                        for (auto it = found.first; it != found.second; ++it) {
                            dest_to_output[it->second].add_row(row);
                            found_read_count += 1;
                        }
                    }

                    // Store how many rows in this batch were selected:
                    for (auto & output_file : dest_to_output) {
                        output_file.finish_batch();
                    }

                    progress_bar.update(total_reads_completed + repacker->reads_completed());
                }

                // Submit selected reads to each output:
                for (auto & output_file : dest_to_output) {
                    repacker->add_selected_reads_to_output(
                        output_file.repacker_output,
                        input_reader,
                        gsl::make_span(output_file.batch_counts),
                        gsl::make_span(output_file.all_batch_rows));
                }
            }

            // Batch drain barrier for inputs in this output batch.
            wait_for_open_readers_zero();
        }

        // Set this output batch to finished:
        std::thread finisher([&] {
            for (auto & output_file : dest_to_output) {
                repacker->set_output_finished(output_file.repacker_output);
            }
        });
        auto join_finisher = gsl::finally([&] {
            if (finisher.joinable()) {
                finisher.join();
            }
        });

        // Wait for this batch to complete:
        progress_bar.set_task(batch_prefix + "Waiting for batch IO to complete...");
        try {
            while (!repacker->is_complete()) {
                std::this_thread::sleep_for(std::chrono::milliseconds(100));
                poll_python_interrupt();
                progress_bar.update(total_reads_completed + repacker->reads_completed());
            }
        } catch (pybind11::error_already_set const &) {
            throw;
        } catch (std::exception const & e) {
            std::cout << "\nError during repacking: " << e.what() << std::endl;
        }

        if (finisher.joinable()) {
            finisher.join();
        }

        repacker->finish();
        total_reads_completed += repacker->reads_completed();
    }
    progress_bar.set_task("Finished");

    if (found_read_count < total_requested_read_ids && !missing_ok) {
        throw std::runtime_error("Missing read_ids from inputs but --missing-ok not set");
    }

    // Clear created output files from cleanup since we succeeded:
    created_output_files.clear();
}


================================================
FILE: c++/pod5_format_pybind/subset.h
================================================
#include <pybind11/stl/filesystem.h>

#include <filesystem>
#include <map>
#include <string>
#include <vector>

/// Subset reads from a set of input POD5 files into outputs, driven by a read id mapping.
///
/// Only the declaration is visible in this header; the notes below that go beyond the
/// parameter types are assumptions to be confirmed against the implementation.
///
/// \param inputs           Paths of the input files to read from.
/// \param output           Output path.
///                         NOTE(review): presumably the location the destination files are
///                         written to - confirm.
/// \param read_id_to_dest  String -> list-of-strings mapping tying read ids to destinations.
///                         NOTE(review): confirm which side is the read id and which is the
///                         destination; the parameter name alone is not conclusive.
/// \param missing_ok       NOTE(review): presumably suppresses the error raised when some
///                         requested read ids are not found in the inputs - confirm.
/// \param duplicate_ok     NOTE(review): presumably allows a read id to be written more than
///                         once - confirm.
/// \param force_overwrite  NOTE(review): presumably allows existing output files to be
///                         replaced - confirm.
void subset_pod5s_with_mapping(
    std::vector<std::filesystem::path> inputs,
    std::filesystem::path output,
    std::map<std::string, std::vector<std::string>> read_id_to_dest,
    bool missing_ok,
    bool duplicate_ok,
    bool force_overwrite);


================================================
FILE: c++/pod5_format_pybind/utils.h
================================================
#pragma once

#include "pod5_format/result.h"

/// Throw a std::runtime_error whose message is the string form of \p status.
///
/// This throws unconditionally: `status.ok()` is not inspected here, so the caller is
/// responsible for only calling it on a failure.
inline void raise_error(arrow::Status const & status)
{
    auto const message = status.ToString();
    throw std::runtime_error(message);
}

/// Throw a std::runtime_error whose message is the string form of the status held by
/// \p result.
///
/// This throws unconditionally: `result.ok()` is not inspected here, so the caller is
/// responsible for only calling it on a failure.
template <typename T>
inline void raise_error(arrow::Result<T> const & result)
{
    auto const & failure = result.status();
    throw std::runtime_error(failure.ToString());
}

/// Evaluate `statement` exactly once and, if the result's `ok()` is false, turn it into a
/// C++ exception by passing it to `raise_error`.
///
/// The body is wrapped in `do { ... } while (false)` so the macro expands to a single
/// statement and can be followed by a semicolon at the call site.
#define POD5_PYTHON_RETURN_NOT_OK(statement) \
    do {                                     \
        auto const _res = (statement);       \
        if (!_res.ok()) {                    \
            raise_error(_res);               \
        }                                    \
    } while (false)

/// Implementation detail of POD5_PYTHON_ASSIGN_OR_RAISE.
///
/// Binds the value of `rexpr` to a local named `result_name`, passes it to `raise_error` if
/// its `ok()` is false, and otherwise moves the contained value into `lhs`.
///
/// Note: this expands to several statements (a declaration, an `if` and an assignment), so
/// it must not be used as the sole body of an unbraced `if`/`for`/`while`.
#define POD5_PYTHON_ASSIGN_OR_RAISE_IMPL(result_name, lhs, rexpr) \
    auto && result_name = (rexpr);                                \
    if (!(result_name).ok()) {                                    \
        raise_error(result_name);                                 \
    }                                                             \
    lhs = std::move(result_name).ValueUnsafe();

/// Assign the value produced by `rexpr` to `lhs`, or raise a C++ exception if `rexpr`
/// yielded an error.
///
/// The temporary's name is built with ARROW_ASSIGN_OR_RAISE_NAME and __COUNTER__
/// (presumably to give each expansion a distinct identifier - confirm against Arrow's
/// macro definition). The expansion already ends in a semicolon.
#define POD5_PYTHON_ASSIGN_OR_RAISE(lhs, rexpr) \
    POD5_PYTHON_ASSIGN_OR_RAISE_IMPL(           \
        ARROW_ASSIGN_OR_RAISE_NAME(_error_or_value, __COUNTER__), lhs, rexpr);

/// Throw a std::runtime_error built from \p s if it reports a failure; otherwise do nothing.
inline void throw_on_error(pod5::Status const & s)
{
    // Success is the common case: leave without touching the status text.
    if (s.ok()) {
        return;
    }
    throw std::runtime_error(s.ToString());
}

/// Unwrap \p s, returning a copy of the contained value.
///
/// Throws a std::runtime_error built from the held status if \p s reports a failure.
template <typename T>
inline T throw_on_error(pod5::Result<T> const & s)
{
    if (s.ok()) {
        return *s;
    }
    throw std::runtime_error(s.status().ToString());
}


================================================
FILE: c++/test/CMakeLists.txt
================================================

# Unit test executable for the pod5_format library.
# The test-support headers are listed next to the sources they belong with.
add_executable(pod5_unit_tests
    main.cpp
    c_api_null_input.cpp
    c_api_test_utils.h
    c_api_tests.cpp
    c_api_build_test.c
    file_reader_writer_tests.cpp
    output_stream_tests.cpp
    read_table_writer_utils_tests.cpp
    read_table_tests.cpp
    run_info_table_tests.cpp
    schema_tests.cpp
    signal_compression_tests.cpp
    signal_table_tests.cpp
    svb16_scalar_tests.cpp
    svb16_x64_tests.cpp
    test_utils.h
    thread_pool_tests.cpp
    utils.h
    uuid_tests.cpp
)

# Build the C API include check with -Wdocumentation when using a Clang compiler.
# The variable is passed to if() by name rather than as `${...}`: expanding it first
# produces a malformed condition when the value is empty, and lets the expanded text be
# re-evaluated as a variable name.
if (CMAKE_CXX_COMPILER_ID MATCHES "Clang")
    set_source_files_properties(c_api_build_test.c PROPERTIES COMPILE_OPTIONS "-Wdocumentation")
endif()

# `maybe_public_libs` is defined outside this file.
target_link_libraries(pod5_unit_tests
    PUBLIC
        pod5_format
        ${maybe_public_libs}
)

# The tests use C++20 library features (e.g. <bit>).
set_property(TARGET pod5_unit_tests PROPERTY CXX_STANDARD 20)
if (NOT MSVC)
    target_compile_options(pod5_unit_tests PRIVATE ${pod5_warning_options})
endif()

# Register the executable with CTest.
add_test(
    NAME pod5_unit_tests
    COMMAND pod5_unit_tests
)


================================================
FILE: c++/test/TemporaryDirectory.h
================================================
#pragma once

#include "pod5_format/uuid.h"

#include <filesystem>

namespace ont { namespace testutils {

static std::string make_unique_name()
{
    std::random_device gen;
    auto uuid_gen = pod5::BasicUuidRandomGenerator<std::random_device>{gen};
    return to_string(uuid_gen());
}

/// A scoped directory with a fixed name.
///
/// The directory is created by the constructor and recursively removed by the destructor.
class TemporaryDirectory {
public:
    /// Where to create the directory.
    enum class Location { CurrentDir, TempDir };

    /// When to delete the directory: only on destruction, or also before (re)creating it.
    enum class DeleteBehaviour { AfterOnly, BeforeAndAfter };

    /// Creates a random temporary directory
    TemporaryDirectory()
    : TemporaryDirectory(make_unique_name(), Location::TempDir, DeleteBehaviour::AfterOnly)
    {
    }

    /// Create a directory.
    ///
    /// A relative \p path is resolved against the current directory.
    explicit TemporaryDirectory(std::filesystem::path path, DeleteBehaviour delete_behaviour)
    : TemporaryDirectory(std::move(path), Location::CurrentDir, delete_behaviour)
    {
    }

    /// Create a directory.
    ///
    /// \param path             Directory to create. A relative path is resolved against
    ///                         \p location; an absolute path is used as-is.
    /// \param location         Base for relative paths: the current directory or the
    ///                         system temporary directory.
    /// \param delete_behaviour With BeforeAndAfter any existing content at the resolved
    ///                         path is removed before the directory is created.
    explicit TemporaryDirectory(
        std::filesystem::path path,
        Location location = Location::CurrentDir,
        DeleteBehaviour delete_behaviour = DeleteBehaviour::AfterOnly)
    {
        if (!path.is_absolute()) {
            if (location == Location::CurrentDir) {
                path = std::filesystem::absolute(path);
            } else {
                path = std::filesystem::temp_directory_path() / path;
            }
        }
        if (delete_behaviour == DeleteBehaviour::BeforeAndAfter) {
            // Remove the resolved target. m_path is still empty at this point, so it
            // must not be used here.
            std::filesystem::remove_all(path);
        }
        std::filesystem::create_directories(path);
        m_path = path;
    }

    TemporaryDirectory(TemporaryDirectory const &) = delete;
    TemporaryDirectory & operator=(TemporaryDirectory const &) = delete;

    // NOTE(review): the defaulted moves rely on a moved-from std::filesystem::path being
    // empty (the standard only promises "valid but unspecified"), and move assignment does
    // not remove the directory previously owned by the target.
    TemporaryDirectory(TemporaryDirectory &&) = default;
    TemporaryDirectory & operator=(TemporaryDirectory &&) = default;

    /// Remove the referenced directory.
    ///
    /// Does nothing if this is not a valid object.
    ~TemporaryDirectory()
    {
        if (!m_path.empty()) {
            // Use the error_code overload so that a failed removal cannot throw from the
            // destructor; the error is deliberately ignored.
            std::error_code error;
            std::filesystem::remove_all(m_path, error);
        }
    }

    /// Path to the directory.
    std::filesystem::path const & path() const { return m_path; }

    /// True when this object refers to a directory (its path is non-empty).
    explicit operator bool() const { return !m_path.empty(); }

private:
    // Absolute path of the managed directory; empty when no directory is referenced.
    std::filesystem::path m_path;
};

/// Stream a human-readable description of \p td, including its path, to \p os.
template <class CharType, class CharTrait>
std::basic_ostream<CharType, CharTrait> & operator<<(
    std::basic_ostream<CharType, CharTrait> & os,
    TemporaryDirectory const & td)
{
    os << "TemporaryDirectory{ " << td.path() << " }";
    return os;
}

}}  // namespace ont::testutils


================================================
FILE: c++/test/c_api_build_test.c
================================================
#include "pod5_format/c_api.h"

// Build check to verify a c file can include the c_api


================================================
FILE: c++/test/c_api_null_input.cpp
================================================
#include "c_api_test_utils.h"
#include "pod5_format/c_api.h"
#include "utils.h"

#include <bit>
#include <numeric>
#include <string_view>

namespace {

/// Put the C API's error state into a known-clean condition before a test call.
///
/// Makes one API call and then requires that the reported error number is OK and that the
/// error string is empty.
void pod5_reset_error()
{
    // NOTE(review): presumably chosen as a cheap call that always succeeds and so clears
    // any error left behind by a previous call - confirm against the C API.
    pod5_vbz_compressed_signal_max_size(1);
    REQUIRE_POD5_OK(pod5_get_error_no());
    REQUIRE(pod5_get_error_string() == std::string_view{});
}

namespace detail {

/// Map the index of a pointer among the pointer-typed arguments to its index among all
/// arguments.
///
/// For example, with `Args = int, int *, char *` pointer 0 is argument 1 and pointer 1 is
/// argument 2. Throws if there is no such pointer.
template <std::size_t PtrIdx, typename... Args>
constexpr std::size_t ptr_idx_to_arg_idx()
{
    // One flag per argument: set when that argument's type is a pointer.
    bool const is_ptr[]{std::is_pointer_v<Args>...};

    // Walk the arguments keeping a running pointer count, and stop at the first argument
    // where that count reaches the one we're after.
    std::size_t pointers_seen = 0;
    for (std::size_t arg_i = 0; arg_i < sizeof...(Args); ++arg_i) {
        if (is_ptr[arg_i]) {
            ++pointers_seen;
        }
        if (pointers_seen == PtrIdx + 1) {
            return arg_i;
        }
    }

    throw "Cannot find arg for ptr";
}

/// Null out the PtrIdx'th pointer argument in \p args unless its bit is set in
/// \p valid_ptr_bitset.
///
/// Bit `PtrIdx` of the bitset set means "leave this pointer as it is".
template <std::size_t PtrIdx, typename... Args>
void make_ptr_null_impl(std::tuple<Args...> & args, std::uint64_t valid_ptr_bitset)
{
    // Locate the tuple slot that holds this pointer and check it really is one.
    constexpr std::size_t ArgIdx = ptr_idx_to_arg_idx<PtrIdx, Args...>();
    using ArgT = std::remove_reference_t<decltype(std::get<ArgIdx>(args))>;
    static_assert(std::is_pointer_v<ArgT>);

    // A cleared bit marks the pointer as invalid for this call: replace it with nullptr.
    bool const keep_pointer = ((valid_ptr_bitset >> PtrIdx) & 1) != 0;
    if (keep_pointer) {
        return;
    }
    std::get<ArgIdx>(args) = nullptr;
}

/// Apply make_ptr_null_impl to every pointer index in `PtrIdxs`.
///
/// \param args             Argument tuple to modify in place.
/// \param valid_ptr_bitset Bitset forwarded unchanged to each make_ptr_null_impl call.
///
/// The unnamed std::index_sequence parameter exists only to deduce the `PtrIdxs` pack.
template <typename... Args, std::size_t... PtrIdxs>
void make_ptrs_null(
    std::tuple<Args...> & args,
    std::uint64_t valid_ptr_bitset,
    std::index_sequence<PtrIdxs...>)
{
    // Comma fold: one call per pointer index, evaluated left to right.
    (make_ptr_null_impl<PtrIdxs>(args, valid_ptr_bitset), ...);
}

/// Call \p func with the elements of \p args as its arguments and return its result.
///
/// The unnamed std::index_sequence parameter is kept so existing call sites are unchanged.
template <typename... Args, std::size_t... ArgIdxs>
auto unpack_and_call(
    pod5_error_t (*func)(Args...),
    std::tuple<Args...> args,
    std::index_sequence<ArgIdxs...>)
{
    // std::apply expands the tuple into func(std::get<0>(args), std::get<1>(args), ...).
    return std::apply(func, args);
}

}  // namespace detail

/// Call \p func repeatedly with different subsets of its pointer arguments replaced by
/// nullptr, and check that every such call fails with an error string mentioning "null".
///
/// \param func C API function under test.
/// \param args A complete set of valid arguments for \p func.
///
/// Every combination with at least one null pointer is tried; the all-valid combination is
/// where the loop stops and is not itself called.
template <typename... Args>
void call_with_nulls(pod5_error_t (*func)(Args...), Args... args)
{
    constexpr std::size_t num_args = sizeof...(Args);
    static_assert(num_args <= 64, "uint64_t isn't big enough for a bitmask");
    constexpr std::size_t num_pointers = (std::is_pointer_v<Args> + ...);

    constexpr auto ArgIdxs = std::make_index_sequence<num_args>();
    constexpr auto PtrIdxs = std::make_index_sequence<num_pointers>();

    // Pristine copy of the arguments; each iteration starts again from this.
    auto const valid_inputs = std::make_tuple(args...);

    // Bit i set means pointer i is left valid. Count upwards from "all null" and stop once
    // every pointer bit is set.
    std::uint64_t valid_ptr_bitset = 0;
    while (std::popcount(valid_ptr_bitset) != num_pointers) {
        CAPTURE(valid_ptr_bitset);

        // Swap the pointers whose bits are clear for nullptr.
        auto inputs = valid_inputs;
        detail::make_ptrs_null(inputs, valid_ptr_bitset, PtrIdxs);

        // Start from a clean error state and invoke the function under test.
        pod5_reset_error();
        pod5_error_t const result = detail::unpack_and_call(func, inputs, ArgIdxs);

        // The call must have failed.
        // TODO: We could improve this to check that the first invalid arg matches the error that's
        // reported (ie null string, null file, etc...), but this is already overengineered enough.
        //int const first_ptr = std::countr_zero(~valid_ptr_bitset); // codespell:ignore
        CHECK_POD5_NOT_OK(result);
        CHECK_THAT(pod5_get_error_string(), Catch::Matchers::Contains("null"));

        ++valid_ptr_bitset;
    }
}

TEST_CASE("NULL input doesn't crash")
{
    using Catch::Matchers::Contains;

    pod5_init();
    auto cleanup = gsl::finally([] { pod5_terminate(); });

    // Make a temporary file for the read API to use.
    static constexpr char const temporary_filename[] = "./foo_c_api.pod5";
    {
        REQUIRE(remove_file_if_exists(temporary_filename).ok());
        Pod5FileWriter_t * writer = pod5_create_file(temporary_filename, "c_software", nullptr);
        REQUIRE_POD5_OK(pod5_get_error_no());
        REQUIRE(writer);

        std::int16_t pore_type_id{};
        REQUIRE_POD5_OK(pod5_add_pore(&pore_type_id, writer, "pore_type"));

        std::int16_t run_info_id{};
        size_t const num_kv_pairs = 1;
        char const * keys[]{"key"};
        char const * values[]{"value"};
        REQUIRE_POD5_OK(pod5_add_run_info(
            &run_info_id,
            writer,
            "acquisition_id",
            1,
            1,
            -1,
            num_kv_pairs,
            keys,
            values,
            "experiment_name",
            "flow_cell_id",
            "flow_cell_product_code",
            "protocol_name",
            "protocol_run_id",
            1,
            "sample_id",
            1,
            "sequencing_kit",
            "sequencer_position",
            "sequencer_position_type",
            "software",
            "system_name",
            "system_type",
            num_kv_pairs,
            keys,
            values));

        read_id_t const read_id{};
        uint32_t const read_number{};
        uint64_t const start_sample{};
        float const median_before{};
        uint16_t const channel{};
        uint8_t const well{};
        float const calibration_offset{};
        float const calibration_scale{};
        pod5_end_reason_t const end_reason{};
        uint8_t const end_reason_forced{};
        uint64_t const num_minknow_events{};
        float const tracked_scaling_scale{};
        float const tracked_scaling_shift{};
        float const predicted_scaling_scale{};
        float const predicted_scaling_shift{};
        uint32_t const num_reads_since_mux_change{};
        float const time_since_mux_change{};
        float const open_pore_level{};

        ReadBatchRowInfoArrayV3 const row_data_v3{
            &read_id,
            &read_number,
            &start_sample,
            &median_before,
            &channel,
            &well,
            &pore_type_id,
            &calibration_offset,
            &calibration_scale,
            &end_reason,
            &end_reason_forced,
            &run_info_id,
            &num_minknow_events,
            &tracked_scaling_scale,
            &tracked_scaling_shift,
            &predicted_scaling_scale,
            &predicted_scaling_shift,
            &num_reads_since_mux_change,
            &time_since_mux_change};

        int16_t const signal_data[]{1, 2, 3, 4, 5};
        uint32_t const signal_size = std::size(signal_data);
        auto * signal_data_ptr = signal_data;

        REQUIRE_POD5_OK(pod5_add_reads_data(
            writer,
            1,
            READ_BATCH_ROW_INFO_VERSION_3,
            &row_data_v3,
            &signal_data_ptr,
            &signal_size));

        ReadBatchRowInfoArrayV4 const row_data_v4{
            &read_id,
            &read_number,
            &start_sample,
            &median_before,
            &channel,
            &well,
            &pore_type_id,
            &calibration_offset,
            &calibration_scale,
            &end_reason,
            &end_reason_forced,
            &run_info_id,
            &num_minknow_events,
            &tracked_scaling_scale,
            &tracked_scaling_shift,
            &predicted_scaling_scale,
            &predicted_scaling_shift,
            &num_reads_since_mux_change,
            &time_since_mux_change,
            &open_pore_level};

        REQUIRE_POD5_OK(pod5_add_reads_data(
            writer,
            1,
            READ_BATCH_ROW_INFO_VERSION_4,
            &row_data_v4,
            &signal_data_ptr,
            &signal_size));

        REQUIRE_POD5_OK(pod5_close_and_free_writer(writer));
    }

    SECTION("Reader API")
    {
        {
            INFO("pod5_open_file")

            pod5_reset_error();
            CHECK(pod5_open_file(nullptr) == nullptr);
            CHECK_THAT(pod5_get_error_string(), Contains("null string passed"));
        }

        {
            INFO("pod5_open_file_options")

            Pod5ReaderOptions_t options{};

            pod5_reset_error();
            CHECK(pod5_open_file_options(nullptr, nullptr) == nullptr);
            CHECK_THAT(pod5_get_error_string(), Contains("null string passed"));

            pod5_reset_error();
            CHECK(pod5_open_file_options(temporary_filename, nullptr) == nullptr);
            CHECK_THAT(pod5_get_error_string(), Contains("null passed"));

            pod5_reset_error();
            CHECK(pod5_open_file_options(nullptr, &options) == nullptr);
            CHECK_THAT(pod5_get_error_string(), Contains("null string passed"));
        }

        {
            INFO("pod5_close_and_free_reader")

            pod5_reset_error();
            CHECK_POD5_OK(pod5_close_and_free_reader(nullptr));
        }

        // The rest of these functions require a reader.
        Pod5FileReader_t * mutable_reader = pod5_open_file(temporary_filename);
        REQUIRE(mutable_reader);
        auto close_reader =
            gsl::finally([&mutable_reader] { pod5_close_and_free_reader(mutable_reader); });
        Pod5FileReader_t const * reader = mutable_reader;

        {
            INFO("pod5_get_file_info")

            FileInfo file_info{};
            call_with_nulls(pod5_get_file_info, reader, &file_info);
        }

        {
            INFO("pod5_get_file_read_table_location")

            EmbeddedFileData_t file_data{};
            call_with_nulls(pod5_get_file_read_table_location, reader, &file_data);
        }

        {
            INFO("pod5_get_file_signal_table_location")

            EmbeddedFileData_t file_data{};
            call_with_nulls(pod5_get_file_signal_table_location, reader, &file_data);
        }

        {
            INFO("pod5_get_file_run_info_table_location")

            EmbeddedFileData_t file_data{};
            call_with_nulls(pod5_get_file_run_info_table_location, reader, &file_data);
        }

        {
            INFO("pod5_get_read_count")

            size_t count{};
            call_with_nulls(pod5_get_read_count, reader, &count);
        }

        {
            INFO("pod5_get_read_ids")

            std::array<read_id_t, 3> read_ids{};
            call_with_nulls(pod5_get_read_ids, reader, read_ids.size(), read_ids.data());
        }

        {
            INFO("pod5_plan_traversal")

            constexpr std::size_t read_id_count = 1;
            uint8_t const read_id_array[read_id_count * 16]{};
            uint32_t batch_counts{};
            uint32_t batch_rows{};
            size_t find_success_count_out{};
            call_with_nulls(
                pod5_plan_traversal,
                reader,
                read_id_array,
                read_id_count,
                &batch_counts,
                &batch_rows,
                &find_success_count_out);
        }

        {
            INFO("pod5_get_read_batch_count")

            size_t count{};
            call_with_nulls(pod5_get_read_batch_count, &count, reader);
        }

        {
            INFO("pod5_get_read_batch")

            Pod5ReadRecordBatch_t * batch = nullptr;
            size_t index{};
            call_with_nulls(pod5_get_read_batch, &batch, reader, index);
        }

        {
            INFO("pod5_free_read_batch")

            pod5_reset_error();
            CHECK_POD5_OK(pod5_free_read_batch(nullptr));
        }

        // The rest of these functions require a batch.
        Pod5ReadRecordBatch_t * mutable_batch = nullptr;
        CHECK_POD5_OK(pod5_get_read_batch(&mutable_batch, reader, 0));
        REQUIRE(mutable_batch);
        auto free_batch = gsl::finally([&mutable_batch] { pod5_free_read_batch(mutable_batch); });
        Pod5ReadRecordBatch_t const * batch = mutable_batch;

        {
            INFO("pod5_get_read_batch_row_count")

            size_t count{};
            call_with_nulls(pod5_get_read_batch_row_count, &count, batch);
        }

        {
            INFO("pod5_get_read_batch_row_info_data")

            ReadBatchRowInfoV4 row_info{};
            size_t row = 0;
            uint16_t struct_version = READ_BATCH_ROW_INFO_VERSION;
            uint16_t read_table_version{};
            call_with_nulls(
                pod5_get_read_batch_row_info_data,
                batch,
                row,
                struct_version,
                static_cast<void *>(&row_info),
                &read_table_version);
        }

        {
            INFO("pod5_get_signal_row_indices")

            size_t row = 0;
            uint64_t indices[1];
            call_with_nulls(
                pod5_get_signal_row_indices,
                batch,
                row,
                static_cast<int64_t>(std::size(indices)),
                indices);
        }

        {
            INFO("pod5_get_calibration_extra_info")

            size_t row = 0;
            CalibrationExtraData_t data{};
            call_with_nulls(pod5_get_calibration_extra_info, batch, row, &data);
        }

        {
            INFO("pod5_get_run_info")

            int16_t index = 0;
            RunInfoDictData_t * data = nullptr;
            call_with_nulls(pod5_get_run_info, batch, index, &data);
        }

        {
            INFO("pod5_get_file_run_info")

            run_info_index_t run_info_index = 0;
            RunInfoDictData_t * run_info_data = nullptr;
            call_with_nulls(pod5_get_file_run_info, reader, run_info_index, &run_info_data);
        }

        {
            INFO("pod5_free_run_info")

            pod5_reset_error();
            CHECK_POD5_OK(pod5_free_run_info(nullptr));
        }

        {
            INFO("pod5_release_run_info")

            pod5_reset_error();
#ifndef _WIN32
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wdeprecated-declarations"
#endif
            CHECK_POD5_OK(pod5_release_run_info(nullptr));
#ifndef _WIN32
#pragma GCC diagnostic pop
#endif
        }

        {
            INFO("pod5_get_file_run_info_count")

            run_info_index_t count{};
            call_with_nulls(pod5_get_file_run_info_count, reader, &count);
        }

        {
            INFO("pod5_get_end_reason")

            int16_t index = 0;
            pod5_end_reason end_reason{};
            std::array<char, 10> string{};
            size_t string_len = string.size();
            call_with_nulls(
                pod5_get_end_reason, batch, index, &end_reason, string.data(), &string_len);
        }

        {
            INFO("pod5_get_pore_type")

            int16_t index = 0;
            std::array<char, 10> string{};
            size_t string_len = string.size();
            call_with_nulls(pod5_get_pore_type, batch, index, string.data(), &string_len);
        }

        {
            INFO("pod5_get_signal_row_info")

            std::array<uint64_t, 1> const signal_rows{};
            SignalRowInfo * signal_row_info = nullptr;
            call_with_nulls(
                pod5_get_signal_row_info,
                reader,
                signal_rows.size(),
                signal_rows.data(),
                &signal_row_info);
        }

        {
            INFO("pod5_free_signal_row_info")

            pod5_reset_error();
            CHECK_POD5_OK(pod5_free_signal_row_info(0, nullptr));
            CHECK_POD5_NOT_OK(pod5_free_signal_row_info(1, nullptr));
        }

        {
            INFO("pod5_get_signal")

            // We need a signal row info.
            uint64_t const signal_row_index = 0;
            SignalRowInfo_t * signal_row_info = nullptr;
            CHECK_POD5_OK(pod5_get_signal_row_info(reader, 1, &signal_row_index, &signal_row_info));
            REQUIRE(signal_row_info);
            auto free_signal_row_info = gsl::finally(
                [&signal_row_info] { pod5_free_signal_row_info(1, &signal_row_info); });

            std::array<int16_t, 10> samples{};
            call_with_nulls(
                pod5_get_signal,
                reader,
                static_cast<SignalRowInfo_t const *>(signal_row_info),
                samples.size(),
                samples.data());
        }

        {
            INFO("pod5_get_read_complete_sample_count")

            size_t row = 0;
            size_t count{};
            call_with_nulls(pod5_get_read_complete_sample_count, reader, batch, row, &count);
        }

        {
            INFO("pod5_get_read_complete_signal")

            size_t row = 1;
            std::array<int16_t, 10> samples{};
            call_with_nulls(
                pod5_get_read_complete_signal, reader, batch, row, samples.size(), samples.data());
        }
    }

    SECTION("Writer API")
    {
        {
            INFO("pod5_create_file")

            pod5_reset_error();
            CHECK(pod5_create_file(nullptr, nullptr, nullptr) == nullptr);
            CHECK_THAT(pod5_get_error_string(), Contains("null string passed"));

            pod5_reset_error();
            CHECK(pod5_create_file(temporary_filename, nullptr, nullptr) == nullptr);
            CHECK_THAT(pod5_get_error_string(), Contains("null string passed"));

            pod5_reset_error();
            CHECK(pod5_create_file(nullptr, temporary_filename, nullptr) == nullptr);
            CHECK_THAT(pod5_get_error_string(), Contains("null string passed"));
        }

        {
            INFO("pod5_close_and_free_writer")

            pod5_reset_error();
            CHECK_POD5_OK(pod5_close_and_free_writer(nullptr));
        }

        // The rest of these functions require a writer.
        REQUIRE(remove_file_if_exists(temporary_filename).ok());
        Pod5FileWriter_t * writer = pod5_create_file(temporary_filename, "c_software", nullptr);
        REQUIRE(writer);
        auto close_writer = gsl::finally([&writer] { pod5_close_and_free_writer(writer); });

        {
            INFO("pod5_add_pore")

            int16_t pore_index{};
            char const pore_type[] = "test";
            call_with_nulls(pod5_add_pore, &pore_index, writer, pore_type);
        }

        {
            INFO("pod5_add_run_info")

            int16_t run_info_index{};

            char const dummy_string[] = "test";

            char const * acquisition_id = dummy_string;
            int64_t acquisition_start_time_ms = 1;
            int16_t adc_max = 1;
            int16_t adc_min = -1;
            char const * experiment_name = dummy_string;
            char const * flow_cell_id = dummy_string;
            char const * flow_cell_product_code = dummy_string;
            char const * protocol_name = dummy_string;
            char const * protocol_run_id = dummy_string;
            int64_t protocol_start_time_ms = 1;
            char const * sample_id = dummy_string;
            uint16_t sample_rate = 1;
            char const * sequencing_kit = dummy_string;
            char const * sequencer_position = dummy_string;
            char const * sequencer_position_type = dummy_string;
            char const * software = dummy_string;
            char const * system_name = dummy_string;
            char const * system_type = dummy_string;

            size_t context_tags_count = 1;
            char const * context_tags_keys[]{dummy_string};
            char const * context_tags_values[]{dummy_string};

            size_t tracking_id_count = 1;
            char const * tracking_id_keys[]{dummy_string};
            char const * tracking_id_values[]{dummy_string};

            call_with_nulls(
                pod5_add_run_info,
                &run_info_index,
                writer,
                acquisition_id,
                acquisition_start_time_ms,
                adc_max,
                adc_min,
                context_tags_count,
                context_tags_keys,
                context_tags_values,
                experiment_name,
                flow_cell_id,
                flow_cell_product_code,
                protocol_name,
                protocol_run_id,
                protocol_start_time_ms,
                sample_id,
                sample_rate,
                sequencing_kit,
                sequencer_position,
                sequencer_position_type,
                software,
                system_name,
                system_type,
                tracking_id_count,
                tracking_id_keys,
                tracking_id_values);
        }

        {
            INFO("pod5_add_reads_data")

            uint32_t count = 1;
            uint16_t version = READ_BATCH_ROW_INFO_VERSION;
            ReadBatchRowInfoArray_t row_info{};
            int16_t const signal[]{1, 2, 3, 4, 5};
            int16_t const * signals[]{signal};
            uint32_t const signal_size = std::size(signal);

            call_with_nulls(
                pod5_add_reads_data,
                writer,
                count,
                version,
                static_cast<void const *>(&row_info),
                signals,
                &signal_size);
        }

        {
            INFO("pod5_add_reads_data_pre_compressed")

            uint32_t count = 1;
            uint16_t version = READ_BATCH_ROW_INFO_VERSION;
            ReadBatchRowInfoArray_t row_info{};

            char const read0_compressed_signal_chunk0[]{1, 2, 3, 4, 5};
            char const * read0_compressed_signal[]{read0_compressed_signal_chunk0};
            size_t const read0_compressed_signal_sizes[]{std::size(read0_compressed_signal_chunk0)};
            uint32_t const read0_sample_counts[]{3};
            size_t const read0_signal_chunk_count = std::size(read0_compressed_signal);

            char const ** compressed_signals[]{read0_compressed_signal};
            size_t const * compressed_signal_sizes[]{read0_compressed_signal_sizes};
            uint32_t const * sample_counts[]{read0_sample_counts};
            size_t const signal_chunk_counts[]{read0_signal_chunk_count};

            call_with_nulls(
                pod5_add_reads_data_pre_compressed,
                writer,
                count,
                version,
                static_cast<void const *>(&row_info),
                compressed_signals,
                compressed_signal_sizes,
                sample_counts,
                signal_chunk_counts);
        }
    }

    SECTION("VBZ API")
    {
        {
            INFO("pod5_vbz_compress_signal")

            std::array<int16_t, 10> const signal{};
            std::array<char, 10> compressed{};
            size_t compressed_size = compressed.size();
            call_with_nulls(
                pod5_vbz_compress_signal,
                signal.data(),
                signal.size(),
                compressed.data(),
                &compressed_size);
        }

        {
            INFO("pod5_vbz_decompress_signal")

            std::array<char, 10> const compressed{};
            std::array<int16_t, 10> signal{};
            call_with_nulls(
                pod5_vbz_decompress_signal,
                compressed.data(),
                compressed.size(),
                signal.size(),
                signal.data());
        }
    }

    SECTION("Misc API")
    {
        {
            INFO("pod5_format_read_id")

            read_id_t const read_id{};
            char * string = nullptr;
            call_with_nulls(pod5_format_read_id, read_id, string);
        }
    }
}

}  // namespace


================================================
FILE: c++/test/c_api_test_utils.h
================================================
#pragma once

#include "pod5_format/c_api.h"

#include <catch2/catch.hpp>

#include <string>

// Non-fatal assertion that a pod5 C API call succeeded.
// `statement` is evaluated exactly once; its result code is paired with the current
// pod5 error string (via testutils::Pod5C_Result::capture) so that a failure report
// shows both the code and the message. Wrapped in do/while(false) so the macro
// behaves as a single statement.
#define CHECK_POD5_OK(statement)                                                    \
    do {                                                                            \
        auto const & _res = (statement);                                            \
        CHECK_THAT(testutils::Pod5C_Result::capture(_res), testutils::IsPod5COk()); \
    } while (false)

// Same check as CHECK_POD5_OK, but expressed with Catch2's REQUIRE_THAT, so the
// current test case is aborted when the pod5 call does not return POD5_OK.
// `statement` is evaluated exactly once.
#define REQUIRE_POD5_OK(statement)                                                    \
    do {                                                                              \
        auto const & _res = (statement);                                              \
        REQUIRE_THAT(testutils::Pod5C_Result::capture(_res), testutils::IsPod5COk()); \
    } while (false)

// Non-fatal assertion that a pod5 C API call failed, i.e. returned anything other
// than POD5_OK (the matcher is negated). `statement` is evaluated exactly once and
// the captured error string is included in any failure report.
#define CHECK_POD5_NOT_OK(statement)                                                 \
    do {                                                                             \
        auto const & _res = (statement);                                             \
        CHECK_THAT(testutils::Pod5C_Result::capture(_res), !testutils::IsPod5COk()); \
    } while (false)

// Same check as CHECK_POD5_NOT_OK, but expressed with Catch2's REQUIRE_THAT, so the
// current test case is aborted when the pod5 call unexpectedly returns POD5_OK.
// `statement` is evaluated exactly once.
#define REQUIRE_POD5_NOT_OK(statement)                                                 \
    do {                                                                               \
        auto const & _res = (statement);                                               \
        REQUIRE_THAT(testutils::Pod5C_Result::capture(_res), !testutils::IsPod5COk()); \
    } while (false)

namespace testutils {

struct Pod5C_Result {
    static Pod5C_Result capture(pod5_error_t err_num)
    {
        return Pod5C_Result{err_num, pod5_get_error_string()};
    }

    pod5_error_t error_code;
    std::string error_string;
};

class IsPod5COk : public Catch::MatcherBase<Pod5C_Result> {
public:
    IsPod5COk() = default;

    bool match(Pod5C_Result const & result) const override { return result.error_code == POD5_OK; }

    virtual std::string describe() const override { return "== POD5_OK"; }
};

}  // namespace testutils

/// Teaches Catch2 how to print a Pod5C_Result in assertion output:
/// the numeric error code followed by the captured error message.
template <>
struct Catch::StringMaker<testutils::Pod5C_Result> {
    static std::string convert(testutils::Pod5C_Result const & value)
    {
        std::string rendered{"{ code: "};
        rendered += std::to_string(value.error_code);
        rendered += "| ";
        rendered += value.error_string;
        rendered += " }";
        return rendered;
    }
};


================================================
FILE: c++/test/c_api_tests.cpp
================================================
#include "pod5_format/c_api.h"

#include "c_api_test_utils.h"
#include "pod5_format/file_reader.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/uuid.h"
#include "pod5_format/version.h"
#include "utils.h"

#include <catch2/catch.hpp>
#include <gsl/gsl-lite.hpp>

#include <algorithm>
#include <iostream>
#include <numeric>

struct Pod5ReadId {
    Pod5ReadId() = default;

    Pod5ReadId(pod5::Uuid const & uid) { uid.to_c_array(read_id); }

    pod5::Uuid as_uuid() const { return pod5::Uuid{read_id}; }

    bool operator==(Pod5ReadId const & other) const { return as_uuid() == other.as_uuid(); }

    read_id_t read_id;
};

// Streams a Pod5ReadId in its UUID form so Catch2 can print it when an
// assertion involving read ids fails.
std::ostream & operator<<(std::ostream & str, Pod5ReadId rid)
{
    auto const as_uuid = rid.as_uuid();
    return str << as_uuid;
}

// Round-trips a small file through the pod5 C API.
//
// The first half writes a file containing one pore type, one run info and two reads:
//   - read 0 is added uncompressed using the V4 row-info layout,
//   - read 1 is added pre-compressed (VBZ) using the V3 row-info layout.
// The second half re-opens the file and checks that every field, the signal data,
// the dictionary lookups (pore type / end reason / run info) and the documented
// error paths (bad indices, short string buffers, null arguments) behave as expected.
SCENARIO("C API Reads")
{
    static constexpr char const * filename = "./foo_c_api.pod5";

    pod5_init();
    auto fin = gsl::finally([] { pod5_terminate(); });

    std::mt19937 gen{Catch::rngSeed()};
    auto uuid_gen = pod5::UuidRandomGenerator{gen};
    auto input_read_id = uuid_gen();
    auto input_read_id_2 = uuid_gen();
    std::vector<int16_t> signal_1(10);
    std::iota(signal_1.begin(), signal_1.end(), -20000);

    std::vector<int16_t> signal_2(20);
    std::iota(signal_2.begin(), signal_2.end(), 0);

    std::int16_t adc_min = -4096;
    std::int16_t adc_max = 4095;

    float calibration_offset = 54.0f;
    float calibration_scale = 100.0f;

    float predicted_scale = 2.3f;
    float predicted_shift = 10.0f;
    float tracked_scale = 4.3f;
    float tracked_shift = 15.0f;
    std::uint32_t num_reads_since_mux_change = 1234;
    float time_since_mux_change = 2.4f;
    float open_pore_level = 123.0f;
    std::uint64_t num_minknow_events = 104;

    // Write the file:
    {
        // Invalid arguments to pod5_create_file must fail and set the error number.
        CHECK_POD5_OK(pod5_get_error_no());
        CHECK_FALSE(pod5_create_file(NULL, "c_software", NULL));
        CHECK(pod5_get_error_no() == POD5_ERROR_INVALID);
        CHECK_FALSE(pod5_create_file("", "c_software", NULL));
        CHECK(pod5_get_error_no() == POD5_ERROR_INVALID);
        CHECK_FALSE(pod5_create_file("", NULL, NULL));
        CHECK(pod5_get_error_no() == POD5_ERROR_INVALID);

        REQUIRE(remove_file_if_exists(filename).ok());

        auto file = pod5_create_file(filename, "c_software", NULL);
        REQUIRE(file);
        CHECK_POD5_OK(pod5_get_error_no());

        std::int16_t pore_type_id = -1;
        CHECK_POD5_OK(pod5_add_pore(&pore_type_id, file, "pore_type"));
        CHECK(pore_type_id == 0);

        std::vector<char const *> context_tags_keys{"thing", "foo"};
        std::vector<char const *> context_tags_values{"thing_val", "foo_val"};
        std::vector<char const *> tracking_id_keys{"baz", "other"};
        std::vector<char const *> tracking_id_values{"baz_val", "other_val"};

        std::uint32_t read_number = 12;
        std::uint64_t start_sample = 10245;
        float median_before = 200.0f;
        std::uint16_t channel = 43;
        std::uint8_t well = 4;
        pod5_end_reason_t end_reason = POD5_END_REASON_MUX_CHANGE;
        uint8_t end_reason_forced = false;
        auto read_id_array = (read_id_t const *)input_read_id.data();

        // Each member points at a single value because only one read is added per call.
        std::int16_t run_info_id = 0;
        ReadBatchRowInfoArrayV4 row_data{
            read_id_array,
            &read_number,
            &start_sample,
            &median_before,
            &channel,
            &well,
            &pore_type_id,
            &calibration_offset,
            &calibration_scale,
            &end_reason,
            &end_reason_forced,
            &run_info_id,
            &num_minknow_events,
            &tracked_scale,
            &tracked_shift,
            &predicted_scale,
            &predicted_shift,
            &num_reads_since_mux_change,
            &time_since_mux_change,
            &open_pore_level};

        std::int16_t const * signal_arr[] = {signal_1.data()};
        std::uint32_t signal_size[] = {(std::uint32_t)signal_1.size()};

        // Referencing a non-existent run id should fail:
        CHECK(
            pod5_add_reads_data(
                file, 1, READ_BATCH_ROW_INFO_VERSION_4, &row_data, signal_arr, signal_size)
            == POD5_ERROR_INVALID);

        // Now actually add the run info:
        CHECK_POD5_OK(pod5_add_run_info(
            &run_info_id,
            file,
            "acquisition_id",
            15400,
            adc_max,
            adc_min,
            context_tags_keys.size(),
            context_tags_keys.data(),
            context_tags_values.data(),
            "experiment_name",
            "flow_cell_id",
            "flow_cell_product_code",
            "protocol_name",
            "protocol_run_id",
            200000,
            "sample_id",
            4000,
            "sequencing_kit",
            "sequencer_position",
            "sequencer_position_type",
            "software",
            "system_name",
            "system_type",
            tracking_id_keys.size(),
            tracking_id_keys.data(),
            tracking_id_values.data()));
        CHECK(run_info_id == 0);

        // First read: uncompressed signal, V4 row info.
        CHECK_POD5_OK(pod5_add_reads_data(
            file, 1, READ_BATCH_ROW_INFO_VERSION_4, &row_data, signal_arr, signal_size));

        // Second read: signal compressed up-front by the caller, V3 row info.
        {
            auto compressed_read_max_size = pod5_vbz_compressed_signal_max_size(signal_2.size());
            std::vector<char> compressed_signal(compressed_read_max_size);
            char const * compressed_data[] = {compressed_signal.data()};
            char const ** compressed_data_ptr = compressed_data;
            // In: capacity of the output buffer. Out: number of bytes actually written.
            std::size_t compressed_size[] = {compressed_signal.size()};
            std::size_t const * compressed_size_ptr = compressed_size;
            std::uint32_t signal_2_size[] = {(std::uint32_t)signal_2.size()};
            std::uint32_t const * signal_size_ptr = signal_2_size;
            // A failed compression would leave `compressed_size` meaningless, so stop here
            // rather than report a confusing failure from the add call below.
            REQUIRE_POD5_OK(pod5_vbz_compress_signal(
                signal_2.data(), signal_2.size(), compressed_signal.data(), compressed_size));

            // Number of signal chunks supplied for the (single) read.
            std::size_t signal_counts = 1;

            auto read_id_2_array = (read_id_t const *)input_read_id_2.data();
            ReadBatchRowInfoArrayV3 row_data_v3{
                read_id_2_array,
                &read_number,
                &start_sample,
                &median_before,
                &channel,
                &well,
                &pore_type_id,
                &calibration_offset,
                &calibration_scale,
                &end_reason,
                &end_reason_forced,
                &run_info_id,
                &num_minknow_events,
                &tracked_scale,
                &tracked_shift,
                &predicted_scale,
                &predicted_shift,
                &num_reads_since_mux_change,
                &time_since_mux_change};

            CHECK_POD5_OK(pod5_add_reads_data_pre_compressed(
                file,
                1,
                READ_BATCH_ROW_INFO_VERSION_3,
                &row_data_v3,
                &compressed_data_ptr,
                &compressed_size_ptr,
                &signal_size_ptr,
                &signal_counts));
        }

        CHECK_POD5_OK(pod5_close_and_free_writer(file));
        CHECK_POD5_OK(pod5_get_error_no());
    }

    // Read the file back:
    {
        CHECK_POD5_OK(pod5_get_error_no());
        CHECK_FALSE(pod5_open_file(NULL));
        auto file = pod5_open_file(filename);
        CHECK_POD5_OK(pod5_get_error_no());
        // Everything below needs a valid reader, so a failed open is fatal.
        REQUIRE(file);

        FileInfo_t file_info;
        CHECK_POD5_OK(pod5_get_file_info(file, &file_info));
        CHECK(file_info.version.major == pod5::Pod5MajorVersion);
        CHECK(file_info.version.minor == pod5::Pod5MinorVersion);
        CHECK(file_info.version.revision == pod5::Pod5RevVersion);
        {
            // Cross-check the file identifier against the C++ reader.
            auto reader = pod5::open_file_reader(filename);
            pod5::Uuid file_identifier{file_info.file_identifier};
            CHECK(file_identifier == (*reader)->schema_metadata().file_identifier);
        }

        std::size_t read_count = 0;
        CHECK_POD5_OK(pod5_get_read_count(file, &read_count));
        REQUIRE(read_count == 2);

        std::vector<Pod5ReadId> read_ids(2);
        // An output array smaller than the read count must be rejected.
        CHECK(pod5_get_read_ids(file, 1, (read_id_t *)read_ids.data()) != POD5_OK);
        CHECK_POD5_OK(pod5_get_read_ids(file, read_ids.size(), (read_id_t *)read_ids.data()));
        std::vector<Pod5ReadId> expected_read_ids{input_read_id, input_read_id_2};
        CHECK(read_ids == expected_read_ids);

        std::size_t batch_count = 0;
        CHECK_POD5_OK(pod5_get_read_batch_count(&batch_count, file));
        REQUIRE(batch_count == 1);

        Pod5ReadRecordBatch * batch_0 = nullptr;
        CHECK_POD5_OK(pod5_get_read_batch(&batch_0, file, 0));
        REQUIRE(batch_0);

        std::size_t row_count = 0;
        CHECK_POD5_OK(pod5_get_read_batch_row_count(&row_count, batch_0));
        REQUIRE(row_count == 2);

        // Check out of bounds accesses get errors
        {
            ReadBatchRowInfoV4 row_info;
            uint16_t input_version = 0;
            CHECK(
                pod5_get_read_batch_row_info_data(
                    batch_0, row_count, READ_BATCH_ROW_INFO_VERSION, &row_info, &input_version)
                == POD5_ERROR_INDEXERROR);

            std::vector<uint64_t> signal_row_indices{1};
            CHECK(
                pod5_get_signal_row_indices(
                    batch_0, row_count, signal_row_indices.size(), signal_row_indices.data())
                == POD5_ERROR_INDEXERROR);

            CalibrationExtraData calibration_extra_data{};
            CHECK(
                pod5_get_calibration_extra_info(batch_0, row_count, &calibration_extra_data)
                == POD5_ERROR_INDEXERROR);
        }

        for (std::size_t row = 0; row < row_count; ++row) {
            CAPTURE(row);
            // Row 0 was written with signal_1, row 1 with signal_2.
            auto const & signal = (row == 1) ? signal_2 : signal_1;

            static_assert(
                std::is_same<ReadBatchRowInfoV4, ReadBatchRowInfo_t>::value,
                "Update this if new structs added");

            ReadBatchRowInfoV3 v3_struct;
            ReadBatchRowInfoV4 v4_struct;
            uint16_t input_version = 0;
            CHECK_POD5_OK(pod5_get_read_batch_row_info_data(
                batch_0, row, READ_BATCH_ROW_INFO_VERSION_3, &v3_struct, &input_version));
            CHECK(
                input_version
                == 4);  // We're reading from a v4 file, even if the input struct is v3.
            CHECK_POD5_OK(pod5_get_read_batch_row_info_data(
                batch_0, row, READ_BATCH_ROW_INFO_VERSION_4, &v4_struct, &input_version));
            CHECK(input_version == 4);

            // Checks the fields common to the V3 and V4 row-info structs.
            auto check_v3_or_v4 = [&](auto name, auto const & input_struct) {
                CAPTURE(name);
                // 36 characters of formatted UUID plus room for a null terminator, so the
                // call never has to write outside storage the test owns.
                std::array<char, 37> formatted_uuid{};
                CHECK_POD5_OK(pod5_format_read_id(input_struct.read_id, formatted_uuid.data()));
                CHECK(
                    std::string{formatted_uuid.data()}
                    == to_string(*reinterpret_cast<pod5::Uuid const *>(input_struct.read_id)));

                CHECK(input_struct.read_number == 12);
                CHECK(input_struct.start_sample == 10245);
                CHECK(input_struct.median_before == 200.0f);
                CHECK(input_struct.channel == 43);
                CHECK(input_struct.well == 4);
                CHECK(input_struct.pore_type == 0);
                CHECK(input_struct.calibration_offset == calibration_offset);
                CHECK(input_struct.calibration_scale == calibration_scale);
                CHECK(input_struct.end_reason == 1);
                CHECK(input_struct.end_reason_forced == uint8_t{false});
                CHECK(input_struct.run_info == 0);
                CHECK(input_struct.num_minknow_events == num_minknow_events);
                CHECK(input_struct.tracked_scaling_scale == tracked_scale);
                CHECK(input_struct.tracked_scaling_shift == tracked_shift);
                CHECK(input_struct.predicted_scaling_scale == predicted_scale);
                CHECK(input_struct.predicted_scaling_shift == predicted_shift);
                CHECK(input_struct.num_reads_since_mux_change == num_reads_since_mux_change);
                CHECK(input_struct.time_since_mux_change == time_since_mux_change);
                CHECK(input_struct.signal_row_count == 1);
                CHECK(input_struct.num_samples == signal.size());
            };

            check_v3_or_v4("v3", v3_struct);
            check_v3_or_v4("v4", v4_struct);
            if (row == 0) {
                CHECK(v4_struct.open_pore_level == open_pore_level);
            } else {
                // Row 1 was written through the V3 layout, which has no open pore level.
                CHECK(std::isnan(v4_struct.open_pore_level));
            }

            // The code below dereferences the first signal row, so an unexpected row
            // count must stop the test instead of indexing an empty vector.
            REQUIRE(v3_struct.signal_row_count == 1);

            std::vector<uint64_t> signal_row_indices(v3_struct.signal_row_count);
            CHECK_POD5_OK(pod5_get_signal_row_indices(
                batch_0, row, signal_row_indices.size(), signal_row_indices.data()));

            // Fatal on failure: the returned pointers are dereferenced immediately after.
            std::vector<SignalRowInfo *> signal_row_info(v3_struct.signal_row_count);
            REQUIRE_POD5_OK(pod5_get_signal_row_info(
                file,
                signal_row_indices.size(),
                signal_row_indices.data(),
                signal_row_info.data()));
            REQUIRE(signal_row_info.front());

            std::vector<int16_t> read_signal(signal_row_info.front()->stored_sample_count);
            REQUIRE(signal_row_info.front()->stored_sample_count == signal.size());
            CHECK_POD5_OK(pod5_get_signal(
                file,
                signal_row_info.front(),
                signal_row_info.front()->stored_sample_count,
                read_signal.data()));
            CHECK(read_signal == signal);

            std::size_t sample_count = 0;
            CHECK_POD5_OK(pod5_get_read_complete_sample_count(file, batch_0, row, &sample_count));
            CHECK(sample_count == signal_row_info.front()->stored_sample_count);
            CHECK_POD5_OK(pod5_get_read_complete_signal(
                file, batch_0, row, sample_count, read_signal.data()));
            CHECK(read_signal == signal);

            CHECK_POD5_OK(
                pod5_free_signal_row_info(signal_row_indices.size(), signal_row_info.data()));

            std::string expected_pore_type{"pore_type"};
            std::array<char, 128> char_buffer{};
            std::size_t returned_size = 2;  // deliberately too short!
            {
                CHECK(
                    pod5_get_pore_type(
                        batch_0, v3_struct.pore_type, char_buffer.data(), &returned_size)
                    == POD5_ERROR_STRING_NOT_LONG_ENOUGH);
                // The required size (including the terminator) is reported back.
                CHECK(returned_size == expected_pore_type.size() + 1);
            }
            {
                returned_size = char_buffer.size();
                CHECK_POD5_OK(pod5_get_pore_type(
                    batch_0, v3_struct.pore_type, char_buffer.data(), &returned_size));
                CHECK(returned_size == expected_pore_type.size() + 1);
                CHECK(std::string{char_buffer.data()} == expected_pore_type);
            }
            {
                // An invalid pore type index must fail and leave the size untouched.
                returned_size = char_buffer.size();
                CHECK(
                    pod5_get_pore_type(batch_0, -1, char_buffer.data(), &returned_size)
                    == POD5_ERROR_INDEXERROR);
                CHECK(returned_size == char_buffer.size());
            }

            std::string expected_end_reason{"mux_change"};
            {
                returned_size = 2;  // deliberately too short!
                pod5_end_reason end_reason = POD5_END_REASON_UNKNOWN;
                CHECK(
                    pod5_get_end_reason(
                        batch_0,
                        v3_struct.end_reason,
                        &end_reason,
                        char_buffer.data(),
                        &returned_size)
                    == POD5_ERROR_STRING_NOT_LONG_ENOUGH);
                CHECK(returned_size == expected_end_reason.size() + 1);
            }
            {
                returned_size = char_buffer.size();
                pod5_end_reason end_reason = POD5_END_REASON_UNKNOWN;
                CHECK_POD5_OK(pod5_get_end_reason(
                    batch_0,
                    v3_struct.end_reason,
                    &end_reason,
                    char_buffer.data(),
                    &returned_size));
                CHECK(returned_size == expected_end_reason.size() + 1);
                CHECK(end_reason == POD5_END_REASON_MUX_CHANGE);
                CHECK(std::string{char_buffer.data()} == expected_end_reason);
            }
            // Check getting with an invalid input end reason index:
            {
                returned_size = char_buffer.size();
                pod5_end_reason end_reason = POD5_END_REASON_UNKNOWN;
                CHECK(
                    pod5_get_end_reason(
                        batch_0,
                        v3_struct.end_reason + 100,
                        &end_reason,
                        char_buffer.data(),
                        &returned_size)
                    == POD5_ERROR_INDEXERROR);
                // Neither output may be modified on failure.
                CHECK(returned_size == char_buffer.size());
                CHECK(end_reason == POD5_END_REASON_UNKNOWN);
            }

            CalibrationExtraData calibration_extra_data{};
            CHECK_POD5_OK(pod5_get_calibration_extra_info(batch_0, row, &calibration_extra_data));
            // With adc_min = -4096 and adc_max = 4095 the digitisation is 8192.
            CHECK(calibration_extra_data.digitisation == adc_max - adc_min + 1);
            CHECK(calibration_extra_data.range == 8192 * calibration_scale);
        }

        SECTION("Embedded files")
        {
            // Every embedded table must be reported as living inside the pod5 file itself,
            // at a non-zero offset and with a non-zero length.
            for (auto [get_file_location, name] : {
                     std::make_tuple(
                         pod5_get_file_read_table_location, "pod5_get_file_read_table_location"),
                     std::make_tuple(
                         pod5_get_file_signal_table_location,
                         "pod5_get_file_signal_table_location"),
                     std::make_tuple(
                         pod5_get_file_run_info_table_location,
                         "pod5_get_file_run_info_table_location"),
                 })
            {
                CAPTURE(name);
                EmbeddedFileData_t embedded_file_data{};
                CHECK_POD5_OK(get_file_location(file, &embedded_file_data));
                REQUIRE(embedded_file_data.file_name != nullptr);
                CHECK(embedded_file_data.file_name == std::string_view{filename});
                CHECK(embedded_file_data.offset > 0);
                CHECK(embedded_file_data.length > 0);
            }
        }

        run_info_index_t run_info_count = 0;
        CHECK_POD5_OK(pod5_get_file_run_info_count(file, &run_info_count));
        REQUIRE(run_info_count == 1);

        // Check getting invalid run info indexes fails correctly.
        RunInfoDictData * run_info_error = nullptr;
        CHECK(pod5_get_run_info(batch_0, -1, &run_info_error) == POD5_ERROR_INDEXERROR);
        CHECK_FALSE(run_info_error);
        CHECK(pod5_get_run_info(batch_0, run_info_count, &run_info_error) == POD5_ERROR_INDEXERROR);
        CHECK_FALSE(run_info_error);
        CHECK(pod5_get_file_run_info(file, -1, &run_info_error) == POD5_ERROR_INDEXERROR);
        CHECK_FALSE(run_info_error);
        CHECK(
            pod5_get_file_run_info(file, run_info_count, &run_info_error) == POD5_ERROR_INDEXERROR);
        CHECK_FALSE(run_info_error);

        // Verifies the key/value maps written by pod5_add_run_info above.
        auto check_run_info = [](RunInfoDictData * run_info) {
            REQUIRE(run_info);
            CHECK(run_info->tracking_id.size == 2);
            CHECK(run_info->tracking_id.keys[0] == std::string("baz"));
            CHECK(run_info->tracking_id.keys[1] == std::string("other"));
            CHECK(run_info->tracking_id.values[0] == std::string("baz_val"));
            CHECK(run_info->tracking_id.values[1] == std::string("other_val"));
            CHECK(run_info->context_tags.size == 2);
            CHECK(run_info->context_tags.keys[0] == std::string("thing"));
            CHECK(run_info->context_tags.keys[1] == std::string("foo"));
            CHECK(run_info->context_tags.values[0] == std::string("thing_val"));
            CHECK(run_info->context_tags.values[1] == std::string("foo_val"));
        };

        // The same run info must be reachable both from the file and from the batch.
        RunInfoDictData * run_info_data_out_1 = nullptr;
        CHECK_POD5_OK(pod5_get_file_run_info(file, 0, &run_info_data_out_1));
        check_run_info(run_info_data_out_1);
        pod5_free_run_info(run_info_data_out_1);

        RunInfoDictData * run_info_data_out_2 = nullptr;
        CHECK_POD5_OK(pod5_get_run_info(batch_0, 0, &run_info_data_out_2));
        check_run_info(run_info_data_out_2);
        pod5_free_run_info(run_info_data_out_2);

        pod5_free_read_batch(batch_0);

        pod5_close_and_free_reader(file);
        CHECK_POD5_OK(pod5_get_error_no());
    }
}

SCENARIO("C API Many Reads")
{
    static constexpr char const * filename = "./foo_c_api.pod5";

    pod5_init();
    auto fin = gsl::finally([] { pod5_terminate(); });

    std::mt19937 gen{Catch::rngSeed()};
    auto uuid_gen = pod5::UuidRandomGenerator{gen};
    std::vector<int16_t> signal_1(10);
    std::iota(signal_1.begin(), signal_1.end(), -20000);

    std::vector<int16_t> signal_2(20);
    std::iota(signal_2.begin(), signal_2.end(), 0);

    std::size_t const read_count = 10037;

    std::int16_t const adc_min = -4096;
    std::int16_t const adc_max = 4095;

    std::vector<pod5::Uuid> read_id_array(read_count);
    std::generate(read_id_array.begin(), read_id_array.end(), uuid_gen);

    // Write the file:
    {
        CHECK_POD5_OK(pod5_get_error_no());
        CHECK_FALSE(pod5_create_file(NULL, "c_software", NULL));
        CHECK(pod5_get_error_no() == POD5_ERROR_INVALID);
        CHECK_FALSE(pod5_create_file("", "c_software", NULL));
        CHECK(pod5_get_error_no() == POD5_ERROR_INVALID);
        CHECK_FALSE(pod5_create_file("", NULL, NULL));
        CHECK(pod5_get_error_no() == POD5_ERROR_INVALID);

        REQUIRE(remove_file_if_exists(filename).ok());

        auto file = pod5_create_file(filename, "c_software", NULL);
        REQUIRE(file);
        CHECK_POD5_OK(pod5_get_error_no());

        std::int16_t pore_type_id = -1;
        CHECK_POD5_OK(pod5_add_pore(&pore_type_id, file, "pore_type"));
        CHECK(pore_type_id == 0);

        std::vector<char const *> context_tags_keys{"thing", "foo"};
        std::vector<char const *> context_tags_values{"thing_val", "foo_val"};
        std::vector<char const *> tracking_id_keys{"baz", "other"};
        std::vector<char const *> tracking_id_values{"baz_val", "other_val"};

        std::int16_t run_info_id = -1;
        CHECK_POD5_OK(pod5_add_run_info(
            &run_info_id,
            file,
            "acquisition_id",
            15400,
            adc_max,
            adc_min,
            context_tags_keys.size(),
            context_tags_keys.data(),
            context_tags_values.data(),
            "experiment_name",
            "flow_cell_id",
            "flow_cell_product_code",
            "protocol_name",
            "protocol_run_id",
            200000,
            "sample_id",
            4000,
            "sequencing_kit",
            "sequencer_position",
            "sequencer_position_type",
            "software",
            "system_name",
            "system_type",
            tracking_id_keys.size(),
            tracking_id_keys.data(),
            tracking_id_values.data()));
        CHECK(run_info_id == 0);

        std::vector<std::uint32_t> read_number(read_count, 12);
        std::vector<std::uint64_t> start_sample(read_count, 10245);
        std::vector<float> median_before(read_count, 200.0f);
        std::vector<std::uint16_t> channel(read_count, 43);
        std::vector<std::uint8_t> well(read_count, 4);
        std::vector<pod5_end_reason_t> end_reason(read_count, POD5_END_REASON_MUX_CHANGE);
        std::vector<uint8_t> end_reason_forced(read_count, false);

        std::vector<float> calibration_offset(read_count, 54.0f);
        std::vector<float> calibration_scale(read_count, 100.0f);

        std::vector<float> predicted_scale(read_count, 2.3f);
        std::vector<float> predicted_shift(read_count, 10.0f);
        std::vector<float> tracked_scale(read_count, 4.3f);
        std::vector<float> tracked_shift(read_count, 15.0f);
        std::vector<std::uint32_t> num_reads_since_mux_change(read_count, 1234);
        std::vector<float> time_since_mux_change(read_count, 2.4f);
        std::vector<float> open_pore_level(read_count, 123.0f);
        std::vector<std::uint64_t> num_minknow_events(read_count, 104);

        std::vector<std::int16_t> pore_type_ids(read_count, pore_type_id);
        std::vector<std::int16_t> run_info_ids(read_count, run_info_id);

        std::vector<std::int16_t const *> signal_arr;
        std::vector<std::uint32_t> signal_size;
        ReadBatchRowInfoArrayV4 row_data{
            (read_id_t *)read_id_array.data(),
            read_number.data(),
            start_sample.data(),
            median_before.data(),
            channel.data(),
            well.data(),
            pore_type_ids.data(),
            calibration_offset.data(),
            calibration_scale.data(),
            end_reason.data(),
            end_reason_forced.data(),
            run_info_ids.data(),
            num_minknow_events.data(),
            tracked_scale.data(),
            tracked_shift.data(),
            predicted_scale.data(),
            predicted_shift.data(),
            num_reads_since_mux_change.data(),
            time_since_mux_change.data(),
            open_pore_level.data()};

        for (std::size_t i = 0; i < read_count; ++i) {
            signal_arr.push_back(signal_1.data());
            signal_size.push_back((std::uint32_t)signal_1.size());
        }

        CHECK_POD5_OK(pod5_add_reads_data(
            file,
            read_count,
            READ_BATCH_ROW_INFO_VERSION_3,
            &row_data,
            signal_arr.data(),
            signal_size.data()));

        CHECK_POD5_OK(pod5_close_and_free_writer(file));
        CHECK_POD5_OK(pod5_get_error_no());
    }

    // Read the file back:
    {
        Pod5ReaderOptions_t options{};
        options.force_disable_file_mapping = true;

        CHECK_POD5_OK(pod5_get_error_no());
        CHECK_FALSE(pod5_open_file_options(NULL, &options));
        CHECK_FALSE(pod5_open_file_options(filename, NULL));
        auto file = pod5_open_file_options(filename, &options);
        CHECK_POD5_OK(pod5_get_error_no());
        CHECK(file);

        FileInfo_t file_info;
        CHECK_POD5_OK(pod5_get_file_info(file, &file_info));
        CHECK(file_info.version.major == pod5::Pod5MajorVersion);
        CHECK(file_info.version.minor == pod5::Pod5MinorVersion);
        CHECK(file_info.version.revision == pod5::Pod5RevVersion);
        {
            auto reader = pod5::open_file_reader(filename);
            pod5::Uuid file_identifier{file_info.file_identifier};
            CHECK(file_identifier == (*reader)->schema_metadata().file_identifier);
        }

        std::size_t read_count_returned = 0;
        CHECK_POD5_OK(pod5_get_read_count(file, &read_count_returned));
        REQUIRE(read_count_returned == read_count);

        // Randomise the order of the read IDs and then try and plan a path through them.
        std::shuffle(read_id_array.begin(), read_id_array.end(), gen);
        std::vector<std::uint32_t> batch_counts(read_count);
        std::vector<std::uint32_t> batch_rows(read_count);
        std::size_t find_success_count = 0;
        CHECK_POD5_OK(pod5_plan_traversal(
            file,
            reinterpret_cast<uint8_t const *>(read_id_array.data()),
            read_count,
            batch_counts.data(),
            batch_rows.data(),
            &find_success_count));
        REQUIRE(find_success_count == read_count);

        CHECK_POD5_OK(pod5_close_and_free_reader(file));
    }
}

// Round-trips run info records through the C API: ten run infos are written to a new file, then
// the file is reopened and each run info is read back by index and its acquisition id compared.
SCENARIO("C API Run Info")
{
    static constexpr char const * filename = "./foo_c_api.pod5";

    pod5_init();
    // Pair the init above with a terminate on every exit path from the test.
    auto fin = gsl::finally([] { pod5_terminate(); });

    std::int16_t adc_min = -4096;
    std::int16_t adc_max = 4095;

    // Builds the acquisition id used for the run info written at `index`, so the write and read
    // halves of the test agree on the expected value.
    auto expected_acq_id = [](std::size_t index) {
        std::string acquisition_id{"acquisition_id_"};
        acquisition_id += std::to_string(index);
        return acquisition_id;
    };

    // Write the file:
    {
        REQUIRE(remove_file_if_exists(filename).ok());

        auto file = pod5_create_file(filename, "c_software", NULL);
        REQUIRE(file);
        CHECK_POD5_OK(pod5_get_error_no());

        std::vector<char const *> context_tags_keys{"thing", "foo"};
        std::vector<char const *> context_tags_values{"thing_val", "foo_val"};
        std::vector<char const *> tracking_id_keys{"baz", "other"};
        std::vector<char const *> tracking_id_values{"baz_val", "other_val"};

        // Every run info differs only in its acquisition id.
        for (std::size_t i = 0; i < 10; ++i) {
            std::int16_t run_info_id = -1;
            CHECK_POD5_OK(pod5_add_run_info(
                &run_info_id,
                file,
                expected_acq_id(i).c_str(),
                15400,
                adc_max,
                adc_min,
                context_tags_keys.size(),
                context_tags_keys.data(),
                context_tags_values.data(),
                "experiment_name",
                "flow_cell_id",
                "flow_cell_product_code",
                "protocol_name",
                "protocol_run_id",
                200000,
                "sample_id",
                4000,
                "sequencing_kit",
                "sequencer_position",
                "sequencer_position_type",
                "software",
                "system_name",
                "system_type",
                tracking_id_keys.size(),
                tracking_id_keys.data(),
                tracking_id_values.data()));
            // The index handed back is expected to match the insertion order.
            CHECK(run_info_id == static_cast<std::int16_t>(i));
        }
        CHECK_POD5_OK(pod5_close_and_free_writer(file));
    }

    // Read the file back:
    {
        CHECK_POD5_OK(pod5_get_error_no());
        // A null path must be rejected rather than crash.
        CHECK_FALSE(pod5_open_file(NULL));
        auto file = pod5_open_file(filename);
        // A successful open is expected to leave the error number and error string clear, even
        // though the preceding call failed.
        CHECK_POD5_OK(pod5_get_error_no());
        CHECK(pod5_get_error_string() == std::string{""});
        REQUIRE(file);

        run_info_index_t run_info_count = 0;
        CHECK_POD5_OK(pod5_get_file_run_info_count(file, &run_info_count));
        REQUIRE(run_info_count == 10);

        for (run_info_index_t i = 0; i < 10; ++i) {
            RunInfoDictData * run_info_data_out = nullptr;
            CHECK_POD5_OK(pod5_get_file_run_info(file, i, &run_info_data_out));
            CHECK(run_info_data_out->acquisition_id == expected_acq_id(i));
            // Each run info obtained above is released with the matching free call.
            pod5_free_run_info(run_info_data_out);
        }

        CHECK_POD5_OK(pod5_close_and_free_reader(file));
    }
}

// Opening a path that does not exist must yield a null reader.
TEST_CASE("Missing file passed to pod5_open_file")
{
    pod5_init();
    auto terminate_on_exit = gsl::finally([] { pod5_terminate(); });

    // Make sure nothing is left at the path from an earlier test before trying to open it.
    static constexpr char const missing_file_path[] = "./foo_c_api.pod5";
    auto const removal_status = remove_file_if_exists(missing_file_path);
    REQUIRE(removal_status.ok());

    auto * const reader = pod5_open_file(missing_file_path);
    CHECK(reader == nullptr);
}

// Creating a file at a path that is already occupied must fail and yield a null writer.
TEST_CASE("Existing file passed to pod5_create_file")
{
    pod5_init();
    auto terminate_on_exit = gsl::finally([] { pod5_terminate(); });

    static constexpr char const occupied_path[] = "./foo_c_api.pod5";
    auto const removal_status = remove_file_if_exists(occupied_path);
    REQUIRE(removal_status.ok());

    // First creation: the path is free, so this must succeed and leave a file on disk.
    Pod5FileWriter_t * first_writer = pod5_create_file(occupied_path, "c_software", nullptr);
    REQUIRE_POD5_OK(pod5_get_error_no());
    REQUIRE(first_writer != nullptr);
    REQUIRE_POD5_OK(pod5_close_and_free_writer(first_writer));

    // Second creation: the file written above is still there, so no writer may be returned.
    Pod5FileWriter_t * second_writer = pod5_create_file(occupied_path, "c_software", nullptr);
    CHECK(second_writer == nullptr);
}

// Creates a file through the C API both without an options struct (null pointer) and with an
// options struct covering combinations of chunk size, compression type and batch sizes.
TEST_CASE("pod5_create_file with options")
{
    pod5_init();
    auto cleanup = gsl::finally([] { pod5_terminate(); });

    static constexpr char const temporary_filename[] = "./foo_c_api.pod5";
    REQUIRE(remove_file_if_exists(temporary_filename).ok());

    Pod5WriterOptions_t test_options{};
    Pod5WriterOptions_t const * options = nullptr;
    bool const with_options = GENERATE(false, true);
    if (with_options) {
        // The generated values must be populated on the branch that actually hands the struct
        // to pod5_create_file; otherwise only value-initialised options are ever exercised.
        options = &test_options;
        test_options.max_signal_chunk_size = GENERATE(0, 1, 2);
        test_options.signal_compression_type = GENERATE(
            CompressionOption::DEFAULT_SIGNAL_COMPRESSION,
            CompressionOption::VBZ_SIGNAL_COMPRESSION,
            CompressionOption::UNCOMPRESSED_SIGNAL);
        test_options.signal_table_batch_size = GENERATE(0, 1, 2);
        test_options.read_table_batch_size = GENERATE(0, 1, 2);
    }

    // Record the active combination so a failure report identifies which one broke.
    CAPTURE(
        with_options,
        test_options.max_signal_chunk_size,
        test_options.signal_compression_type,
        test_options.signal_table_batch_size,
        test_options.read_table_batch_size);

    Pod5FileWriter_t * writer = pod5_create_file(temporary_filename, "c_software", options);
    REQUIRE_POD5_OK(pod5_get_error_no());
    REQUIRE(writer != nullptr);
    REQUIRE_POD5_OK(pod5_close_and_free_writer(writer));
}

// Round-trips a small signal through the C API VBZ compress/decompress functions and checks
// that mismatched buffer sizes and oversized requests are reported as errors.
TEST_CASE("VBZ compression")
{
    pod5_init();
    auto cleanup = gsl::finally([] { pod5_terminate(); });

    std::size_t const sample_count = 20;
    std::vector<int16_t> input_signal(sample_count);
    // Centre the ramp on zero so both negative and positive samples are covered. The start value
    // is computed in signed arithmetic: negating the unsigned sample_count would wrap around and
    // only produce the intended value through narrowing.
    auto const first_sample = static_cast<int16_t>(-static_cast<int>(sample_count / 2));
    std::iota(input_signal.begin(), input_signal.end(), first_sample);

    // Determine max size.
    std::size_t const compressed_read_max_size =
        pod5_vbz_compressed_signal_max_size(input_signal.size());
    REQUIRE(compressed_read_max_size > 0);

    // Compress it.
    std::vector<char> compressed_signal(compressed_read_max_size);
    // In/out parameter: holds the buffer capacity on entry; the checks below rely on it holding
    // the number of bytes actually used on return.
    std::size_t compressed_size = compressed_read_max_size;
    REQUIRE_POD5_OK(pod5_vbz_compress_signal(
        input_signal.data(), input_signal.size(), compressed_signal.data(), &compressed_size));
    REQUIRE(compressed_size <= compressed_read_max_size);
    compressed_signal.resize(compressed_size);

    // Decompress it.
    std::vector<int16_t> output_signal(sample_count);
    REQUIRE_POD5_OK(pod5_vbz_decompress_signal(
        compressed_signal.data(), compressed_signal.size(), sample_count, output_signal.data()));
    REQUIRE(input_signal == output_signal);

    // Providing incorrect buffer sizes should fail rather than crash.
    CHECK_POD5_NOT_OK(pod5_vbz_decompress_signal(
        compressed_signal.data(),
        compressed_signal.size(),
        sample_count * 2,
        output_signal.data()));
    std::size_t bad_compressed_size = compressed_size / 2;
    CHECK_POD5_NOT_OK(pod5_vbz_compress_signal(
        input_signal.data(), input_signal.size(), compressed_signal.data(), &bad_compressed_size));

    // Going over the maximum size should produce an error.
    size_t const max_size_error = pod5_vbz_compressed_signal_max_size(std::uint64_t{1} << 48);
    CHECK(max_size_error == 0);
    CHECK_POD5_NOT_OK(pod5_get_error_no());
}


================================================
FILE: c++/test/file_reader_writer_tests.cpp
================================================
#include "pod5_format/async_signal_loader.h"
#include "pod5_format/file_reader.h"
#include "pod5_format/file_writer.h"
#include "pod5_format/internal/combined_file_utils.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/signal_table_reader.h"
#include "pod5_format/thread_pool.h"
#include "pod5_format/uuid.h"
#include "TemporaryDirectory.h"
#include "test_utils.h"
#include "utils.h"

#include <arrow/array/array_binary.h>
#include <arrow/array/array_dict.h>
#include <arrow/array/array_primitive.h>
#include <arrow/io/file.h>
#include <arrow/memory_pool.h>
#include <catch2/catch.hpp>

#include <chrono>
#include <fstream>
#include <numeric>
#include <string>
#include <thread>

/// Writes a pod5 file containing ten identical reads to \p file, then reopens it and checks the
/// read table, the signal table and the AsyncSignalLoader output.
///
/// \param file             Path of the file to create; any existing file at the path is removed.
/// \param extra_options    Writer options used as the starting point. The chunk size and the two
///                         table batch sizes are always overridden below.
void run_file_reader_writer_tests(
    char const * file,
    pod5::FileWriterOptions const & extra_options = {})
{
    REQUIRE_ARROW_STATUS_OK(remove_file_if_exists(file));
    (void)pod5::register_extension_types();
    auto fin = gsl::finally([] { (void)pod5::unregister_extension_types(); });

    auto const run_info_data = get_test_run_info_data("_run_info");

    // Seeded from the Catch2 RNG seed so a run can be reproduced.
    std::mt19937 gen{Catch::rngSeed()};
    auto uuid_gen = pod5::UuidRandomGenerator{gen};
    auto read_id_1 = uuid_gen();

    std::uint16_t channel = 25;
    std::uint8_t well = 3;
    std::uint32_t read_number = 1234;
    std::uint64_t start_sample = 12340;
    std::uint64_t num_minknow_events = 27;
    float median_before = 224.0f;
    float calib_offset = 22.5f;
    float calib_scale = 1.2f;
    float tracked_scaling_scale = 2.3f;
    float tracked_scaling_shift = 100.0f;
    float predicted_scaling_scale = 1.5f;
    float predicted_scaling_shift = 50.0f;
    std::uint32_t num_reads_since_mux_change = 3;
    float time_since_mux_change = 200.0f;
    float open_pore_level = 150.0f;

    // 100,000 samples with a 20,480 sample chunk limit: the checks below expect each read to be
    // split into four full chunks plus one chunk of 18,080 samples.
    std::vector<std::int16_t> signal_1(100'000);
    std::iota(signal_1.begin(), signal_1.end(), 0);

    // Write a file:
    {
        pod5::FileWriterOptions options = extra_options;
        options.set_max_signal_chunk_size(20'480);
        options.set_read_table_batch_size(1);
        options.set_signal_table_batch_size(5);

        auto writer = pod5::create_file_writer(file, "test_software", options);
        REQUIRE_ARROW_STATUS_OK(writer);

        auto run_info = (*writer)->add_run_info(run_info_data);
        auto end_reason = (*writer)->lookup_end_reason(pod5::ReadEndReason::signal_negative);
        bool end_reason_forced = true;
        auto pore_type = (*writer)->add_pore_type("Pore_type");

        // The same read (same id, same signal) is added ten times.
        for (std::size_t i = 0; i < 10; ++i) {
            CHECK_ARROW_STATUS_OK((*writer)->add_complete_read(
                {read_id_1,
                 read_number,
                 start_sample,
                 channel,
                 well,
                 *pore_type,
                 calib_offset,
                 calib_scale,
                 median_before,
                 *end_reason,
                 end_reason_forced,
                 *run_info,
                 num_minknow_events,
                 tracked_scaling_scale,
                 tracked_scaling_shift,
                 predicted_scaling_scale,
                 predicted_scaling_shift,
                 num_reads_since_mux_change,
                 time_since_mux_change,
                 open_pore_level},
                gsl::make_span(signal_1)));
        }
        // The writer goes out of scope here, before the file is reopened for reading.
    }

    // Open the file for reading and verify its contents:
    {
        auto reader = pod5::open_file_reader(file, {});
        REQUIRE_ARROW_STATUS_OK(reader);

        // With a read table batch size of one, each of the ten reads is expected in its own batch.
        REQUIRE((*reader)->num_read_record_batches() == 10);
        for (std::size_t i = 0; i < 10; ++i) {
            auto read_batch = (*reader)->read_read_record_batch(i);
            REQUIRE_ARROW_STATUS_OK(read_batch);

            auto read_id_array = read_batch->read_id_column();
            CHECK(read_id_array->length() == 1);
            CHECK(read_id_array->Value(0) == read_id_1);

            // Follow the run info dictionary index back to the acquisition id, then to the full
            // run info record, and compare it with what was written.
            auto columns = *read_batch->columns();
            auto const run_info_dict_index =
                std::dynamic_pointer_cast<arrow::Int16Array>(columns.run_info->indices())->Value(0);
            CHECK(run_info_dict_index == 0);
            auto const run_info_id = read_batch->get_run_info(run_info_dict_index);
            CHECK(*run_info_id == run_info_data.acquisition_id);
            auto const run_info = (*reader)->find_run_info(*run_info_id);
            CHECK(**run_info == run_info_data);

            // With a signal table batch size of five, the five chunks of each read are expected
            // to fill exactly one signal batch.
            REQUIRE((*reader)->num_signal_record_batches() == 10);
            auto signal_batch = (*reader)->read_signal_record_batch(i);
            REQUIRE_ARROW_STATUS_OK(signal_batch);

            auto signal_read_id_array = signal_batch->read_id_column();
            CHECK(signal_read_id_array->length() == 5);
            CHECK(signal_read_id_array->Value(0) == read_id_1);
            CHECK(signal_read_id_array->Value(1) == read_id_1);
            CHECK(signal_read_id_array->Value(2) == read_id_1);
            CHECK(signal_read_id_array->Value(3) == read_id_1);
            CHECK(signal_read_id_array->Value(4) == read_id_1);

            auto vbz_signal_array = signal_batch->vbz_signal_column();
            CHECK(vbz_signal_array->length() == 5);

            // Four full chunks followed by the 18,080 sample remainder.
            auto samples_array = signal_batch->samples_column();
            CHECK(samples_array->Value(0) == 20'480);
            CHECK(samples_array->Value(1) == 20'480);
            CHECK(samples_array->Value(2) == 20'480);
            CHECK(samples_array->Value(3) == 20'480);
            CHECK(samples_array->Value(4) == 18'080);
        }

        // Run the loader checks once per samples mode.
        auto const samples_mode = GENERATE(
            pod5::AsyncSignalLoader::SamplesMode::NoSamples,
            pod5::AsyncSignalLoader::SamplesMode::Samples);

        // NOTE: despite its name, this loader is used for both samples modes generated above.
        pod5::AsyncSignalLoader async_no_samples_loader(
            *reader,
            samples_mode,
            {},  // Read all the batches
            {}   // No specific rows within batches
        );

        for (std::size_t i = 0; i < 10; ++i) {
            CAPTURE(i);
            auto first_batch_res = async_no_samples_loader.release_next_batch();
            REQUIRE_ARROW_STATUS_OK(first_batch_res);
            auto first_batch = std::move(*first_batch_res);
            // Batches are expected to be released in file order.
            CHECK(first_batch->batch_index() == i);

            CHECK(first_batch->sample_count().size() == 1);
            CHECK(first_batch->sample_count()[0] == signal_1.size());

            // The sample count is checked in both modes; the sample data itself is only expected
            // to be populated in Samples mode.
            CHECK(first_batch->samples().size() == 1);
            if (samples_mode == pod5::AsyncSignalLoader::SamplesMode::Samples) {
                CHECK(first_batch->samples()[0] == signal_1);
            } else {
                CHECK(first_batch->samples()[0].size() == 0);
            }
        }
    }
}

// Runs the shared reader/writer round-trip with default writer options in the working directory.
SCENARIO("File Reader Writer Tests")
{
    run_file_reader_writer_tests("./foo.pod5");
}

#ifdef __linux__
// Runs the shared reader/writer round-trip with direct-io requested on a freshly mounted tmpfs
// drive.
TEST_CASE("Additional make_file_stream() tests")
{
    // When the user filesystem doesn't support direct-io, but it is requested then
    // make_file_stream() should fallback to a "regular" FileOutputStream

    // Because of the disk mounting, this test can only be run by someone or something that
    // is effectively a root user.
    if (::geteuid() != 0) {
        WARN("SKIPPING TEST: Need root privileges to mount a test drive.");
        return;
    }

    // The timestamp suffix keeps the directory name distinct between test runs.
    std::filesystem::path const dir_path = "./ramdisk_" + std::to_string(std::time(nullptr));

    // Registered before the directory is created so that every exit path below, including the
    // "mount failed" skip, removes it again. Removing a path that does not exist is not an error.
    auto remove_directory = gsl::finally([&] { std::filesystem::remove(dir_path); });

    // Create and mount tmpfs drive.
    try {
        std::filesystem::create_directory(dir_path);
        auto const mount_cmd = std::string{"mount -o size=500M -t tmpfs none "} + dir_path.string();
        auto const mount_return = std::system(mount_cmd.c_str());
        if (mount_return != 0) {
            // we have seen this fail in CI where the test thinks it can mount
            // but CI fails to mount, just skip the test
            WARN("SKIPPING TEST: Need root privileges to mount a test drive.");
            return;
        }
    } catch (std::exception const & e) {
        FAIL("Failed to create and mount a tmpfs drive: " << e.what());
    }

    // Declared after remove_directory so that it is destroyed first: the drive is unmounted
    // before the (then empty) mount point directory is removed.
    auto const umount_cmd = std::string{"umount "} + dir_path.string();
    auto remove_mount = gsl::finally([&] { std::ignore = std::system(umount_cmd.c_str()); });

    pod5::FileWriterOptions options_for_direct_io;
    options_for_direct_io.set_use_directio(true);
    options_for_direct_io.set_use_sync_io(true);
    options_for_direct_io.set_write_chunk_size(524288);

    try {
        auto const test_file_path = dir_path / "bar.pod5";
        run_file_reader_writer_tests(test_file_path.c_str(), options_for_direct_io);
    } catch (std::exception const & e) {
        FAIL("Failed to run file reader/writer tests: " << e.what());
    }
}
#endif

// Opens the checked-in test files (multi_fast5_zip_v0 .. v4) and verifies that the current reader
// returns the same read data and run info for every one of them.
SCENARIO("Opening older files")
{
    (void)pod5::register_extension_types();
    auto fin = gsl::finally([] { (void)pod5::unregister_extension_types(); });

    auto uuid_from_string = [](char const * val) -> pod5::Uuid {
        auto result = pod5::Uuid::from_string(val);
        REQUIRE(result);
        return *result;
    };

    // The subset of per-read fields that is compared against the files.
    struct ReadData {
        pod5::Uuid read_id;
        std::uint32_t read_number;
        float calibration_offset;
        float calibration_scale;
        std::string end_reason;
        std::string pore_type;
        std::string run_info_id;
    };

    // Expected reads, in the order they appear across the file's read batches.
    std::vector<ReadData> test_read_data{
        {{uuid_from_string("0000173c-bf67-44e7-9a9c-1ad0bc728e74")},
         1093,
         21.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("002fde30-9e23-4125-9eae-d112c18a81a7")},
         75,
         4.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("006d1319-2877-4b34-85df-34de7250a47b")},
         1053,
         6.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("00728efb-2120-4224-87d8-580fbb0bd4b2")},
         657,
         2.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("007cc97e-6de2-4ff6-a0fd-1c1eca816425")},
         1625,
         23.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("008468c3-e477-46c4-a6e2-7d021a4ebf0b")},
         411,
         4.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("008ed3dc-86c2-452f-b107-6877a473d177")},
         513,
         5.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("00919556-e519-4960-8aa5-c2dfa020980c")},
         56,
         2.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("00925f34-6baf-47fc-b40c-22591e27fb5c")},
         930,
         37.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
        {{uuid_from_string("009dc9bd-c5f4-487b-ba4c-b9ce7e3a711e")},
         195,
         14.0f,
         0.1755f,
         "unknown",
         "not_set",
         "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
    };

    // The test data directory is located relative to this source file (three levels up).
    auto repo_root =
        ::arrow::internal::PlatformFilename::FromString(__FILE__)->Parent().Parent().Parent();
    auto path = GENERATE_COPY(
        *repo_root.Join("test_data/multi_fast5_zip_v0.pod5"),
        *repo_root.Join("test_data/multi_fast5_zip_v1.pod5"),
        *repo_root.Join("test_data/multi_fast5_zip_v2.pod5"),
        *repo_root.Join("test_data/multi_fast5_zip_v3.pod5"),
        *repo_root.Join("test_data/multi_fast5_zip_v4.pod5"));
    auto reader = pod5::open_file_reader(path.ToString(), {});
    // The reader is dereferenced immediately below, so a failed open must abort the test here.
    REQUIRE_ARROW_STATUS_OK(reader);

    auto metadata = (*reader)->schema_metadata();
    CHECK(metadata.writing_software == "Python API");

    // Row index across all batches; this is the index into test_read_data.
    std::size_t abs_row = 0;

    for (std::size_t i = 0; i < (*reader)->num_read_record_batches(); ++i) {
        auto batch = (*reader)->read_read_record_batch(i);
        REQUIRE_ARROW_STATUS_OK(batch);

        auto columns = batch->columns();
        REQUIRE_ARROW_STATUS_OK(columns);

        for (std::size_t row = 0; row < batch->num_rows(); ++row) {
            CAPTURE(abs_row);
            // Guard against a file holding more reads than expected before indexing.
            REQUIRE(abs_row < test_read_data.size());
            // `row` restarts at zero for every batch, so the expected data has to be looked up
            // with the absolute row index instead.
            auto const & read_data = test_read_data[abs_row];
            CHECK(columns->read_id->Value(row) == read_data.read_id);
            CHECK(columns->read_number->Value(row) == read_data.read_number);
            CHECK(columns->calibration_offset->Value(row) == read_data.calibration_offset);
            CHECK(columns->calibration_scale->Value(row) == Approx(read_data.calibration_scale));
            auto end_reason = *batch->get_end_reason(columns->end_reason->GetValueIndex(row));
            CHECK(end_reason.first == pod5::end_reason_from_string(read_data.end_reason));
            CHECK(end_reason.second == read_data.end_reason);
            auto pore_type = batch->get_pore_type(columns->pore_type->GetValueIndex(row));
            CHECK(*pore_type == read_data.pore_type);
            auto run_info_id = batch->get_run_info(columns->run_info->GetValueIndex(row));
            CHECK(*run_info_id == read_data.run_info_id);

            ++abs_row;
        }
    }
    // Every expected read must have been seen exactly once.
    CHECK(abs_row == test_read_data.size());

    auto run_info = (*reader)->find_run_info(test_read_data[0].run_info_id);
    REQUIRE_ARROW_STATUS_OK(run_info);
    CHECK((*run_info)->acquisition_id == test_read_data[0].run_info_id);
    CHECK((*run_info)->adc_min == -4096);
    CHECK((*run_info)->adc_max == 4095);
    CHECK((*run_info)->protocol_run_id == "df049455-3552-438c-8176-d4a5b1dd9fc5");
    CHECK((*run_info)->software == "python-pod5-converter");
    CHECK(
        (*run_info)->tracking_id
        == pod5::RunInfoData::MapType{
            {"asic_id", "131070"},
            {"asic_id_eeprom", "0"},
            {"asic_temp", "35.043102"},
            {"asic_version", "IA02C"},
            {"auto_update", "0"},
            {"auto_update_source", "https://mirror.oxfordnanoportal.com/software/MinKNOW/"},
            {"bream_is_standard", "0"},
            {"device_id", "MS00000"},
            {"device_type", "minion"},
            {"distribution_status", "modified"},
            {"distribution_version", "unknown"},
            {"exp_script_name", "c449127e3461a521e0865fe6a88716f6f6b0b30c"},
            {"exp_script_purpose", "sequencing_run"},
            {"exp_start_time", "2019-05-13T11:11:43Z"},
            {"flow_cell_id", ""},
            {"guppy_version", "3.0.3+7e7b7d0"},
            {"heatsink_temp", "35.000000"},
            {"hostname", "happy_fish"},
            {"installation_type", "prod"},
            {"local_firmware_file", "1"},
            {"operating_system", "ubuntu 16.04"},
            {"protocol_group_id", "TEST_EXPERIMENT"},
            {"protocol_run_id", "df049455-3552-438c-8176-d4a5b1dd9fc5"},
            {"protocols_version", "4.0.6"},
            {"run_id", "a08e850aaa44c8b56765eee10b386fc3e516a62b"},
            {"sample_id", "TEST_SAMPLE"},
            {"usb_config", "MinION_fx3_1.1.1_ONT#MinION_fpga_1.1.0#ctrl#Auto"},
            {"version", "3.4.0-rc3"},
        });
}

/// Create an empty file at \p path (an existing file at that path is truncated).
static void touch(std::filesystem::path const & path)
{
    // Opening an output stream is what creates the file; nothing is written to it.
    std::ofstream created_file{path};
    created_file.close();
}

/// Create a file at \p path filled with one million bytes of value zero.
static void write_zeros(std::filesystem::path const & path)
{
    // Build the whole payload up front and hand it to the stream in a single write.
    std::string const zero_bytes(1000000, '\0');
    std::ofstream output{path, std::ios::binary};
    output.write(zero_bytes.data(), static_cast<std::streamsize>(zero_bytes.size()));
}

/// Returns true iff \p file_path is a regular file whose first few bytes are all non-null.
///
/// Only the first MINIMUM_BYTES_WRITTEN bytes are inspected; the rest of the file is not read.
static bool file_writing_started(std::filesystem::path const & file_path)
{
    if (!exists(file_path)) {
        return false;
    }
    if (!is_regular_file(file_path)) {
        return false;
    }
    // This should be enough for the check as unwritten files are usually
    // empty or populated with nulls if writing has not been done.
    constexpr std::size_t MINIMUM_BYTES_WRITTEN = 3;
    if (file_size(file_path) < MINIMUM_BYTES_WRITTEN) {
        return false;
    }
    std::ifstream file{file_path, std::ios::in | std::ios::binary};
    for (std::size_t byte_index = 0; byte_index < MINIMUM_BYTES_WRITTEN; ++byte_index) {
        // Unformatted read: `operator>>` would skip bytes that happen to be whitespace and would
        // leave the destination untouched when extraction fails.
        char byte = '\0';
        if (!file.get(byte)) {
            // The file could not be opened or read; treat that as "not started".
            return false;
        }
        if (byte == '\0') {
            return false;
        }
    }
    return true;
}

/// Returns true once \p directory_path holds at least three files that have started to be written.
static bool files_ready_to_recover(std::filesystem::path const & directory_path)
{
    // The directory should contain 3 files for recovery. A `pod5.tmp` with the signal data
    // a `.tmp-reads` for the reads and a `.tmp-run-info` for the run information.
    std::ptrdiff_t started_file_count = 0;
    for (auto const & entry : std::filesystem::directory_iterator{directory_path}) {
        if (file_writing_started(entry)) {
            ++started_file_count;
        }
    }
    return started_file_count >= 3;
}

/// Polls \p directory_path until the files needed for recovery have started to be written.
/// Fails the current test if that has not happened within 100 seconds.
static void wait_for_files_to_recover(std::filesystem::path const & directory_path)
{
    using clock = std::chrono::steady_clock;
    using std::chrono::milliseconds;

    milliseconds const timeout{100000};
    milliseconds const poll_interval{100};
    auto const started_waiting_at = clock::now();

    for (;;) {
        if (files_ready_to_recover(directory_path)) {
            return;
        }
        auto const elapsed =
            std::chrono::duration_cast<milliseconds>(clock::now() - started_waiting_at);
        REQUIRE(elapsed < timeout);
        // Give any asynchronous file writing threads a chance to write to disk, before we continue.
        std::this_thread::sleep_for(poll_interval);
    }
}

/// Produces a set of unfinalised pod5 writer files for the recovery tests.
///
/// Ten reads are written to \p file_name inside a private temporary directory. While the writer
/// is still alive, the contents of that directory are copied into \p recovery_directory.
///
/// \param file_name            Name of the file handed to the writer.
/// \param read_id_1            Read id used for every read that is written.
/// \param recovery_directory   Directory that receives the copied files.
/// \return Path of \p file_name inside \p recovery_directory.
static std::filesystem::path create_files_for_recovery(
    std::string const & file_name,
    pod5::Uuid read_id_1,
    ont::testutils::TemporaryDirectory & recovery_directory)
{
    auto const run_info_data = get_test_run_info_data("_run_info");

    std::uint16_t channel = 25;
    std::uint8_t well = 3;
    std::uint32_t read_number = 1234;
    std::uint64_t start_sample = 12340;
    std::uint64_t num_minknow_events = 27;
    float median_before = 224.0f;
    float calib_offset = 22.5f;
    float calib_scale = 1.2f;
    float tracked_scaling_scale = 2.3f;
    float tracked_scaling_shift = 100.0f;
    float predicted_scaling_scale = 1.5f;
    float predicted_scaling_shift = 50.0f;
    std::uint32_t num_reads_since_mux_change = 3;
    float time_since_mux_change = 200.0f;
    float open_pore_level = 150.0f;

    std::vector<std::int16_t> signal_1(100'000);
    std::iota(signal_1.begin(), signal_1.end(), 0);

    // The writer works in its own directory; only a copy of it is handed to the caller.
    ont::testutils::TemporaryDirectory data_writing_directory;
    auto file = data_writing_directory.path() / file_name;

    pod5::FileWriterOptions options;
    options.set_max_signal_chunk_size(20'480);
    options.set_read_table_batch_size(1);
    options.set_signal_table_batch_size(5);
    options.set_use_sync_io(true);
    // Keep a handle on the thread pool so it can be drained before the files are copied.
    auto thread_pool = pod5::make_thread_pool(4);
    options.set_thread_pool(thread_pool);

    auto writer_result = pod5::create_file_writer(file.string(), "test_software", options);
    REQUIRE_ARROW_STATUS_OK(writer_result);
    std::unique_ptr<pod5::FileWriter> writer = std::move(*writer_result);

    auto run_info = writer->add_run_info(run_info_data);
    auto end_reason = writer->lookup_end_reason(pod5::ReadEndReason::signal_negative);
    bool end_reason_forced = true;
    auto pore_type = writer->add_pore_type("Pore_type");

    // The same read (same id, same signal) is added ten times.
    for (std::size_t i = 0; i < 10; ++i) {
        CHECK_ARROW_STATUS_OK(writer->add_complete_read(
            {read_id_1,
             read_number,
             start_sample,
             channel,
             well,
             *pore_type,
             calib_offset,
             calib_scale,
             median_before,
             *end_reason,
             end_reason_forced,
             *run_info,
             num_minknow_events,
             tracked_scaling_scale,
             tracked_scaling_shift,
             predicted_scaling_scale,
             predicted_scaling_shift,
             num_reads_since_mux_change,
             time_since_mux_change,
             open_pore_level},
            gsl::make_span(signal_1)));
    }

    // Block until the three files needed for recovery contain data (or the wait times out).
    wait_for_files_to_recover(data_writing_directory.path());

    // Intermittent failures were seen on Windows, where the file was in the middle of being
    // written when we copied it. This ensures that the file writing threads are done before
    // we take the files.
    thread_pool->wait_for_drain();

    // The files are deliberately copied here before they can be properly finalised
    // by the destructor of the FileWriter.
    std::filesystem::copy(data_writing_directory.path(), recovery_directory.path());

    // Confirm the copies themselves are usable before handing them to the caller.
    REQUIRE(files_ready_to_recover(recovery_directory.path()));

    return recovery_directory.path() / file_name;
}

/// Returns true iff \p search_in finishes with \p suffix.
///
/// Stand-in for the C++20 `std::string::ends_with` member function. Replace it with the standard
/// library function once the project moves to C++20 and no longer has to build with GCC 8.
static bool ends_with(std::string const & search_in, std::string const & suffix)
{
    auto const suffix_length = suffix.size();
    if (search_in.size() < suffix_length) {
        // A suffix longer than the string itself can never match.
        return false;
    }
    // Compare the tail of `search_in` with the suffix, character by character.
    char const * const tail = search_in.data() + (search_in.size() - suffix_length);
    return std::char_traits<char>::compare(tail, suffix.data(), suffix_length) == 0;
}

// Sanity checks for the local ends_with() helper.
TEST_CASE("Check custom rolled ends_with works", "[string_utilities]")
{
    // Matching cases: the whole string, and a proper suffix.
    CHECK(ends_with("abc", "abc"));
    CHECK(ends_with("abcdef", "def"));

    // Non-matching cases: a prefix, a suffix longer than the string, and unrelated text.
    CHECK_FALSE(ends_with("abcdef", "abc"));
    CHECK_FALSE(ends_with("def", "abcdef"));
    CHECK_FALSE(ends_with("abc", "def"));
}

/// Returns a copy of `input` in which every character with a special meaning in a regular
/// expression is preceded by a backslash, so that the result matches `input` literally when it
/// is spliced into a larger pattern (the tests in this file embed file paths in expected-error
/// regexes).
///
/// Besides the characters that were always escaped (`\`, `/`, `.`, square brackets and
/// parentheses), the remaining ECMAScript syntax characters (`{ } ^ $ * + ? |`) are escaped as
/// well, so a temporary directory whose name happens to contain one of them cannot change the
/// meaning of the pattern. Inputs without those extra characters produce the same output as
/// before.
static std::string escape_for_regex(std::string const & input)
{
    static std::string const characters_to_escape = "\\/.[](){}^$*+?|";

    std::string output;
    // Worst case: every character gains a leading backslash.
    output.reserve(input.size() * 2);
    for (char const character : input) {
        if (characters_to_escape.find(character) != std::string::npos) {
            output += '\\';
        }
        output += character;
    }
    return output;
}

/// Exercises `pod5::recover_file` against a set of temporary files that were copied before the
/// writer finalised them. Covers the successful path as well as failures caused by the library
/// not being initialised and by each input file being missing, empty, or zero-filled.
///
/// `cleanup` is produced by a Catch2 generator, so every section below is executed once with
/// `RecoverFileOptions::cleanup` set to true and once with it set to false.
TEST_CASE("Recovering .pod5.tmp files", "[recovery]")
{
    std::string const file_name = "foo.pod5.tmp";
    ont::testutils::TemporaryDirectory recovery_directory;
    auto const registration_status = pod5::register_extension_types();
    REQUIRE(registration_status.ok());
    // The unregister action is held through a unique_ptr so that a section can trigger it early
    // by resetting `fin` (see "Recovering whilst extensions are not registered").
    auto const unregister = [] { (void)pod5::unregister_extension_types(); };
    auto fin = std::make_unique<gsl::final_action<decltype(unregister)>>(unregister);
    std::mt19937 gen{Catch::rngSeed()};
    auto uuid_gen = pod5::UuidRandomGenerator{gen};
    std::filesystem::path const path_to_recover =
        create_files_for_recovery(file_name, uuid_gen(), recovery_directory);

    REQUIRE(exists(path_to_recover));
    // Locate the companion temporary files in the recovery directory by their name suffixes.
    std::filesystem::path reads_path, run_path;
    for (auto const & directory_entry :
         std::filesystem::directory_iterator{recovery_directory.path()})
    {
        if (!directory_entry.is_regular_file()) {
            continue;
        }
        if (ends_with(directory_entry.path().filename().string(), (".tmp-reads"))) {
            reads_path = directory_entry.path();
        }
        if (ends_with(directory_entry.path().filename().string(), (".tmp-run-info"))) {
            run_path = directory_entry.path();
        }
    }
    REQUIRE(exists(reads_path));
    REQUIRE(exists(run_path));
    auto const recovered_file_path = recovery_directory.path() / (file_name + "-recovered.pod5");
    // Confirm that no recovered file is left over from previous test runs.
    REQUIRE_FALSE(exists(recovered_file_path));

    // Paths are implicitly convertible to the kind of strings used for paths
    // on the current platform. On Windows this is an `std::wstring`, but the
    // recover_file_writer takes a `std::string`, so we need the explicit
    // conversion to make the build work on that platform.
    // `generic_string()` is used rather than `native()` because Arrow paths
    // always use `/` as a separator, even on Windows.
    std::string const to_recover = path_to_recover.generic_string();
    std::string const recovered = recovered_file_path.generic_string();

    // Run everything below once with cleanup enabled and once with it disabled.
    bool const cleanup = GENERATE(true, false);
    pod5::RecoverFileOptions const options{.cleanup = cleanup};

    CAPTURE(to_recover, recovered, cleanup);

    // Happy path: all three input files are intact.
    SECTION("Recovering basic set of .tmp files.")
    {
        auto const recovery_details = pod5::recover_file(to_recover, recovered, options);
        REQUIRE_ARROW_STATUS_OK(recovery_details);
        CHECK(exists(recovered_file_path));
        // Row counts expected from the data written by create_files_for_recovery.
        CHECK(recovery_details->row_counts.run_info == 1);
        CHECK(recovery_details->row_counts.signal == 50);
        CHECK(recovery_details->row_counts.reads == 10);
        CHECK(recovery_details->cleanup_errors.empty());
        // After a successful recovery the inputs are expected to be removed only when cleanup
        // was requested.
        if (cleanup) {
            CHECK_FALSE(exists(path_to_recover));
            CHECK_FALSE(exists(reads_path));
            CHECK_FALSE(exists(run_path));
        } else {
            CHECK(exists(path_to_recover));
            CHECK(exists(reads_path));
            CHECK(exists(run_path));
        }
    }

    SECTION("Recovering whilst extensions are not registered.")
    {
        // Resetting `fin` destroys the final_action, which runs `unregister` immediately.
        fin = {};
        auto recover_result2 = pod5::recover_file(to_recover, recovered, options);
        REQUIRE_FALSE(recover_result2.ok());
        REQUIRE(
            recover_result2.status().ToString()
            == "Invalid: POD5 library is not correctly initialised.");
        // All inputs are expected to be left alone, whatever the cleanup setting.
        CHECK(exists(path_to_recover));
        CHECK(exists(reads_path));
        CHECK(exists(run_path));
    }

    // Failure modes of the run information temporary file. The file is deleted up front and
    // recreated in a broken state by the sections that need it to exist.
    SECTION("Recovering without run information.")
    {
        remove(run_path);
        std::string const run_info_string = run_path.generic_string();
        CAPTURE(run_info_string);

        SECTION("Recovering set of .tmp files with run info file missing.")
        {
            auto recover_result3 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result3.ok());
            auto const result_message3 = recover_result3.status().ToString();
            // The OS-level detail differs between POSIX and Windows, so the message is matched
            // with a regex that accepts either wording.
            auto const expected_regex3 =
                "IOError: Failed whilst attempting to recover run information from file - "
                + escape_for_regex(run_info_string) + R"(\. Detail: \[(errno|Windows error) 2\] )"
                + R"((No such file or directory|The system cannot find the file specified)[.\n\r]*)";
            REQUIRE_THAT(result_message3, Catch::Matchers::Matches(expected_regex3));
            if (cleanup) {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
                CHECK_FALSE(exists(run_path));
                CHECK_FALSE(exists(recovered_file_path));
            } else {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
            }
        }

        SECTION("Recovering set of .tmp files with run info file empty.")
        {
            touch(run_path);
            auto recover_result4 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result4.ok());
            REQUIRE(
                recover_result4.status().ToString()
                == "Invalid: Failed whilst attempting to recover run information from file - "
                       + run_info_string + ". Detail: File is empty/zero bytes long.");
            // With cleanup, only the unusable run info file is expected to be removed; the
            // other inputs stay and no output file is left behind.
            if (cleanup) {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
                CHECK_FALSE(exists(run_path));
                CHECK_FALSE(exists(recovered_file_path));
            } else {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
                CHECK(exists(run_path));
            }
        }

        SECTION("Recovering set of .tmp files with run info file zeroed.")
        {
            write_zeros(run_path);
            auto recover_result5 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result5.ok());
            REQUIRE(
                recover_result5.status().ToString()
                == "Invalid: Failed whilst attempting to recover run information from file - "
                       + run_info_string + ". Detail: Not an Arrow file");
            if (cleanup) {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
                CHECK_FALSE(exists(run_path));
                CHECK_FALSE(exists(recovered_file_path));
            } else {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
                CHECK(exists(run_path));
            }
        }
    }

    // Failure modes of the reads temporary file; mirrors the run information sections above.
    SECTION("Recovering without read information.")
    {
        remove(reads_path);
        std::string const reads_string = reads_path.generic_string();
        CAPTURE(reads_string);

        SECTION("Recovering set of .tmp files with reads file missing.")
        {
            auto recover_result6 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result6.ok());
            auto const result_message6 = recover_result6.status().ToString();
            // Regex accepts both the POSIX and the Windows wording of "file not found".
            auto const expected_regex6 =
                "IOError: Failed whilst attempting to recover reads from file - "
                + escape_for_regex(reads_string) + R"(\. Detail: \[(errno|Windows error) 2\] )"
                + R"((No such file or directory|The system cannot find the file specified)[.\n\r]*)";
            REQUIRE_THAT(result_message6, Catch::Matchers::Matches(expected_regex6));
            if (cleanup) {
                CHECK(exists(path_to_recover));
                CHECK_FALSE(exists(reads_path));
                CHECK(exists(run_path));
                CHECK_FALSE(exists(recovered_file_path));
            } else {
                CHECK(exists(path_to_recover));
                CHECK(exists(run_path));
            }
        }

        SECTION("Recovering set of .tmp files with reads file empty.")
        {
            touch(reads_path);
            auto recover_result7 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result7.ok());
            REQUIRE(
                recover_result7.status().ToString()
                == "Invalid: Failed whilst attempting to recover reads from file - " + reads_string
                       + ". Detail: File is empty/zero bytes long.");
            // With cleanup, only the unusable reads file is expected to be removed.
            if (cleanup) {
                CHECK(exists(path_to_recover));
                CHECK_FALSE(exists(reads_path));
                CHECK(exists(run_path));
                CHECK_FALSE(exists(recovered_file_path));
            } else {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
                CHECK(exists(run_path));
            }
        }

        SECTION("Recovering set of .tmp files with reads file zeroed.")
        {
            write_zeros(reads_path);
            auto recover_result7 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result7.ok());
            REQUIRE(
                recover_result7.status().ToString()
                == "Invalid: Failed whilst attempting to recover reads from file - " + reads_string
                       + ". Detail: Not an Arrow file");
            if (cleanup) {
                CHECK(exists(path_to_recover));
                CHECK_FALSE(exists(reads_path));
                CHECK(exists(run_path));
                CHECK_FALSE(exists(recovered_file_path));
            } else {
                CHECK(exists(path_to_recover));
                CHECK(exists(reads_path));
                CHECK(exists(run_path));
            }
        }
    }

    // Failure modes of the main .pod5.tmp file itself. The file is deleted up front and then
    // recreated in progressively more complete (but still invalid) states.
    SECTION("Error messages for problems with combined .pod5.tmp file.")
    {
        remove(path_to_recover);

        SECTION("Recovering set of .tmp files with .pod5.tmp file missing.")
        {
            auto recover_result8 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result8.ok());
            auto const result_message = recover_result8.status().ToString();
            // Regex accepts both the POSIX and the Windows wording of "file not found".
            auto const expected_regex =
                "IOError: Failed to open local file '" + escape_for_regex(to_recover)
                + R"('\. Detail: \[(errno|Windows error) 2\] )"
                + R"((No such file or directory|The system cannot find the file specified)[.\n\r]*)";
            CAPTURE(result_message, expected_regex);
            REQUIRE_THAT(result_message, Catch::Matchers::Matches(expected_regex));
            if (cleanup) {
                CHECK_FALSE(exists(recovered_file_path));
            }
            CHECK_FALSE(exists(path_to_recover));
            CHECK(exists(reads_path));
            CHECK(exists(run_path));
        }

        SECTION("Recovering set of .tmp files with .pod5.tmp file empty.")
        {
            touch(path_to_recover);
            auto recover_result9 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result9.ok());
            REQUIRE(recover_result9.status().ToString() == "IOError: Invalid signature in file");
            // With cleanup, the invalid .pod5.tmp file is expected to be removed; the reads and
            // run info files are expected to remain either way.
            if (cleanup) {
                CHECK_FALSE(exists(recovered_file_path));
                CHECK_FALSE(exists(path_to_recover));
            } else {
                CHECK(exists(path_to_recover));
            }
            CHECK(exists(reads_path));
            CHECK(exists(run_path));
        }

        SECTION("Recovering set of .tmp files with .pod5.tmp file zeroed.")
        {
            write_zeros(path_to_recover);
            auto recover_result10 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result10.ok());
            REQUIRE(recover_result10.status().ToString() == "IOError: Invalid signature in file");
            if (cleanup) {
                CHECK_FALSE(exists(recovered_file_path));
                CHECK_FALSE(exists(path_to_recover));
            } else {
                CHECK(exists(path_to_recover));
            }
            CHECK(exists(reads_path));
            CHECK(exists(run_path));
        }

        // The sections below start from a file that holds nothing but a valid file signature.
        arrow::Result<std::shared_ptr<arrow::io::FileOutputStream>> result_tmp_file =
            arrow::io::FileOutputStream::Open(to_recover, false);
        REQUIRE_ARROW_STATUS_OK(result_tmp_file);
        std::shared_ptr<arrow::io::FileOutputStream> tmp_file = std::move(*result_tmp_file);
        REQUIRE_ARROW_STATUS_OK(pod5::combined_file_utils::write_file_signature(tmp_file));

        SECTION("Recover .pod5.tmp missing section marker after signature.")
        {
            // Drop our handle to the stream before recovering (presumably this closes the file
            // so that the signature is on disk — confirm against Arrow's FileOutputStream).
            tmp_file = {};
            auto recover_result11 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result11.ok());
            REQUIRE(recover_result11.status().ToString() == "IOError: Invalid offset into SubFile");
            if (cleanup) {
                CHECK_FALSE(exists(recovered_file_path));
            }
            CHECK(exists(path_to_recover));
            CHECK(exists(reads_path));
            CHECK(exists(run_path));
        }

        SECTION("Recover .pod5.tmp missing signal sub file.")
        {
            // Append a random UUID after the signature to act as the section marker, leaving
            // the file without any signal table content after it.
            pod5::Uuid section_id = uuid_gen();
            REQUIRE_ARROW_STATUS_OK(tmp_file->Write(section_id.data(), section_id.size()));
            tmp_file = {};
            auto recover_result12 = pod5::recover_file(to_recover, recovered, options);
            REQUIRE_FALSE(recover_result12.ok());
            REQUIRE(
                recover_result12.status().ToString()
                == "Invalid: Failed whilst attempting to recover signal data sub file from file - "
                       + to_recover + ". Detail: Not an Arrow file");
            if (cleanup) {
                CHECK_FALSE(exists(recovered_file_path));
            }
            CHECK(exists(path_to_recover));
            CHECK(exists(reads_path));
            CHECK(exists(run_path));
        }
    }
}


================================================
FILE: c++/test/main.cpp
================================================
#define CATCH_CONFIG_MAIN
#include <catch2/catch.hpp>


================================================
FILE: c++/test/output_stream_tests.cpp
================================================
#include "pod5_format/internal/async_output_stream.h"
#include "pod5_format/internal/linux_output_stream.h"
#include "test_utils.h"

#include <arrow/io/file.h>
#include <catch2/catch.hpp>

#include <fstream>
#include <sstream>

namespace {
static constexpr std::size_t TestDataSize = 1024 * 1024 * 100;

std::shared_ptr<arrow::Buffer> get_test_data()
{
    static std::shared_ptr<arrow::Buffer> const data = [] {
        auto result = *arrow::AllocateResizableBuffer(TestDataSize);
        for (std::size_t i = 0; i < TestDataSize; ++i) {
            result->mutable_data()[i] = i % 256;
        }
        return result;
    }();

    return data;
}

std::vector<char> read_file(char const * filename)
{
    std::ifstream fin(filename, std::ios::binary);

    return std::vector<char>(std::istreambuf_iterator<char>(fin), std::istreambuf_iterator<char>());
}

void check_file_contents(char const * filename)
{
    auto contents = read_file(filename);
    auto expected_contents = get_test_data();
    auto expected_contents_span = expected_contents->span_as<char>();

    REQUIRE(contents.size() == expected_contents_span.size());

    for (std::size_t i = 0; i < expected_contents_span.size(); i += 1) {
        CHECK(contents[i] == expected_contents_span[i]);
    }
}
}  // namespace

/// Streams the whole reference payload from `get_test_data()` into `output_stream` using a mix
/// of write shapes: a few tiny raw-pointer writes, two pairs of unevenly sized buffer slices, and
/// finally everything that is left in one write. The stream is flushed after each group.
void run_output_stream_test(std::shared_ptr<arrow::io::OutputStream> output_stream)
{
    auto const data = get_test_data();

    // Group 1: raw pointer + length writes of 1, 2, 4 and 8 bytes.
    std::size_t small_writes_bytes_consumed = 0;
    for (int const write_size : {1, 2, 4, 8}) {
        CHECK_ARROW_STATUS_OK(
            output_stream->Write(data->data() + small_writes_bytes_consumed, write_size));
        small_writes_bytes_consumed += write_size;
    }
    CHECK_ARROW_STATUS_OK(output_stream->Flush());

    // Everything after the small writes is handed over as buffer slices.
    auto remaining_data_buffer = arrow::SliceBuffer(data, small_writes_bytes_consumed);

    // Carves two consecutive slices off the front of the remaining data, writes them in order
    // and flushes.
    auto const write_pair_and_flush = [&](int first_size, int second_size) {
        auto const leading_chunk = arrow::SliceBuffer(remaining_data_buffer, 0, first_size);
        auto const trailing_chunk =
            arrow::SliceBuffer(remaining_data_buffer, first_size, second_size);
        remaining_data_buffer =
            arrow::SliceBuffer(remaining_data_buffer, first_size + second_size);
        CHECK_ARROW_STATUS_OK(output_stream->Write(leading_chunk));
        CHECK_ARROW_STATUS_OK(output_stream->Write(trailing_chunk));
        CHECK_ARROW_STATUS_OK(output_stream->Flush());
    };

    // Group 2: 1 KiB followed by 63 bytes.
    write_pair_and_flush(1024, 63);
    // Group 3: 1 MiB followed by 1023 bytes.
    write_pair_and_flush(1024 * 1024, 1023);

    // Group 4: the rest of the payload in one go.
    CHECK_ARROW_STATUS_OK(output_stream->Write(remaining_data_buffer));
    CHECK_ARROW_STATUS_OK(output_stream->Flush());
}

/// Writes the reference payload through a `pod5::AsyncOutputStream` and verifies the bytes that
/// end up on disk. Runs once for each value of `keep_file_open`.
TEST_CASE("AsyncOutputStream", "[OutputStream]")
{
    using namespace pod5;

    // Captured so that a failure report states which variant was running.
    bool const keep_file_open = GENERATE(true, false);
    CAPTURE(keep_file_open);

    auto const filename = "./test_file.bin";
    {
        // Start from an empty file so stale content from an earlier run cannot leak in.
        std::ofstream f(filename, std::ios_base::trunc);
    }
    {
        auto thread_pool = make_thread_pool(1);
        auto stream = AsyncOutputStream::make(
            filename, thread_pool, true, arrow::default_memory_pool(), keep_file_open);
        // Fail the test cleanly if the stream could not be created, rather than dereferencing
        // an errored Result.
        REQUIRE_ARROW_STATUS_OK(stream);

        run_output_stream_test(*stream);
    }
    // The stream and thread pool have gone out of scope by now, so the file can be inspected.
    check_file_contents(filename);
}

#ifdef __linux__
/// Writes the reference payload through a `pod5::LinuxOutputStream` backed by the synchronous
/// IO manager and verifies the bytes that end up on disk. Runs once for each value of
/// `keep_file_open`.
TEST_CASE("LinuxOutputStream IOManagerSyncImpl", "[OutputStream]")
{
    using namespace pod5;

    bool keep_file_open = GENERATE(true, false);
    CAPTURE(keep_file_open);

    auto filename = "./test_file.bin";
    {
        // Start from an empty file so stale content from an earlier run cannot leak in.
        std::ofstream f(filename, std::ios_base::trunc);
    }
    {
        auto io_manager = pod5::make_sync_io_manager();
        REQUIRE_ARROW_STATUS_OK(io_manager);
        auto stream = LinuxOutputStream::make(
            filename, *io_manager, 10 * 1024 * 1024, true, false, true, keep_file_open);
        // Fail the test cleanly if the stream could not be created, rather than dereferencing
        // an errored Result.
        REQUIRE_ARROW_STATUS_OK(stream);

        run_output_stream_test(*stream);
    }
    // The stream and IO manager have gone out of scope by now, so the file can be inspected.
    check_file_contents(filename);
}

#endif


================================================
FILE: c++/test/read_table_tests.cpp
================================================
#include "pod5_format/internal/async_output_stream.h"
#include "pod5_format/read_table_reader.h"
#include "pod5_format/read_table_writer.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/types.h"
#include "pod5_format/uuid.h"
#include "pod5_format/version.h"
#include "test_utils.h"
#include "utils.h"

#include <arrow/array/array_dict.h>
#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/io/file.h>
#include <arrow/memory_pool.h>
#include <arrow/record_batch.h>
#include <catch2/catch.hpp>

/// Element-wise equality between an Arrow UInt64 array and a plain vector: true only when both
/// hold the same number of elements and every position compares equal.
bool operator==(
    std::shared_ptr<arrow::UInt64Array> const & array,
    std::vector<std::uint64_t> const & vec)
{
    auto const & arrow_values = *array;
    auto const element_count = static_cast<std::size_t>(arrow_values.length());

    // Different sizes can never be equal; this also guards the indexing below.
    if (element_count != vec.size()) {
        return false;
    }

    std::size_t position = 0;
    while (position < element_count) {
        if (arrow_values[position] != vec[position]) {
            return false;
        }
        ++position;
    }
    return true;
}

/// Round-trip test for the read table: writes a configurable number of record batches with
/// `pod5::make_read_table_writer`, reads the file back with `pod5::make_read_table_reader`, and
/// checks the schema metadata, every column value, and the dictionary entries.
SCENARIO("Read table Tests")
{
    using namespace pod5;

    (void)pod5::register_extension_types();
    auto fin = gsl::finally([] { (void)pod5::unregister_extension_types(); });

    std::mt19937 gen{Catch::rngSeed()};
    auto uuid_gen = pod5::UuidRandomGenerator{gen};

    auto file_identifier = uuid_gen();

    // Builds deterministic test data for a given row index: a ReadData whose numeric fields are
    // simple functions of `index`, plus a two-element vector of signal row indices. The same
    // function is used when writing and when verifying, so the values only need to be
    // reproducible. Note that the read id is the all-zero UUID for every index.
    // NOTE(review): the positional initialisers presumably follow pod5::ReadData's member
    // order (read_id, read_number, start_sample, channel, well, pore_type, ...) — confirm
    // against the struct declaration.
    auto data_for_index = [&](std::size_t index) {
        std::array<std::uint8_t, 16> uuid_source{};
        Uuid read_id{uuid_source};

        return std::make_tuple(
            pod5::ReadData{
                read_id,
                std::uint32_t(index * 2),
                std::uint64_t(index * 10),
                std::uint16_t(index + 1),
                std::uint8_t(index + 2),
                0,
                index * 0.1f,
                index * 0.2f,
                index * 100.0f,
                0,
                true,
                0,
                std::uint64_t(index * 150),
                index * 0.4f,
                index * 0.3f,
                index * 0.6f,
                index * 0.5f,
                std::uint32_t(index + 10),
                index * 50.0f,
                index * 0.7f},
            std::vector<std::uint64_t>{index + 2, index + 3});
    };

    GIVEN("A read table writer")
    {
        auto filename = "./foo.pod5";
        auto pool = arrow::system_memory_pool();

        // Both generators combine, so the body runs for every (batch count, reads per batch)
        // pair.
        auto const record_batch_count = GENERATE(as<std::size_t>{}, 1, 2, 5, 10);
        auto const read_count = GENERATE(1, 2);

        // Writing phase. Scoped so the output stream and writers are destroyed before the file
        // is reopened for reading.
        {
            auto file_out =
                *pod5::AsyncOutputStream::make(filename, pod5::make_thread_pool(1), true);
            auto schema_metadata = make_schema_key_value_metadata(
                {file_identifier, "test_software", *parse_version_number(Pod5Version)});
            REQUIRE_ARROW_STATUS_OK(schema_metadata);

            auto pore_writer = pod5::make_pore_writer(pool);
            REQUIRE_ARROW_STATUS_OK(pore_writer);
            auto end_reason_writer = pod5::make_end_reason_writer(pool);
            REQUIRE_ARROW_STATUS_OK(end_reason_writer);
            auto run_info_writer = pod5::make_run_info_writer(pool);
            REQUIRE_ARROW_STATUS_OK(run_info_writer);

            // `read_count` is passed to the writer here; the reading phase below asserts that
            // each record batch then holds exactly `read_count` rows.
            auto writer = pod5::make_read_table_writer(
                file_out,
                *schema_metadata,
                read_count,
                *pore_writer,
                *end_reason_writer,
                *run_info_writer,
                pool);
            REQUIRE_ARROW_STATUS_OK(writer);

            // Populate the dictionaries whose entries are looked up again after reading.
            auto const pore_1 = (*pore_writer)->add("Well Type");
            REQUIRE_ARROW_STATUS_OK(pore_1);
            auto const end_reason_1 = (*end_reason_writer)->lookup(pod5::ReadEndReason::mux_change);
            REQUIRE_ARROW_STATUS_OK(end_reason_1);
            auto const run_info_1 = (*run_info_writer)->add("acq_id_1");
            REQUIRE_ARROW_STATUS_OK(run_info_1);
            auto const run_info_2 = (*run_info_writer)->add("acq_id_2");
            REQUIRE_ARROW_STATUS_OK(run_info_2);

            for (std::size_t i = 0; i < record_batch_count; ++i) {
                for (std::size_t j = 0; j < static_cast<std::size_t>(read_count); ++j) {
                    // Global row index across all batches.
                    auto const idx = j + i * read_count;

                    pod5::ReadData read_data;
                    std::vector<std::uint64_t> signal;
                    std::tie(read_data, signal) = data_for_index(idx);
                    auto row = writer->add_read(read_data, signal, signal.size());

                    REQUIRE_ARROW_STATUS_OK(row);
                    // add_read is expected to report the index of the row it appended.
                    CHECK(*row == idx);
                }
            }
            REQUIRE_ARROW_STATUS_OK(writer->close());
        }

        // Reading phase: reopen the file and verify everything that was written.
        auto file_in = arrow::io::ReadableFile::Open(filename, pool);
        {
            REQUIRE_ARROW_STATUS_OK(file_in);

            auto reader = pod5::make_read_table_reader(*file_in, pool);
            REQUIRE_ARROW_STATUS_OK(reader);

            auto metadata = reader->schema_metadata();
            CHECK(metadata.file_identifier == file_identifier);
            CHECK(metadata.writing_software == "test_software");
            CHECK(metadata.writing_pod5_version == *parse_version_number(Pod5Version));

            REQUIRE(reader->num_record_batches() == record_batch_count);
            for (std::size_t i = 0; i < record_batch_count; ++i) {
                auto const record_batch = reader->read_record_batch(i);
                REQUIRE_ARROW_STATUS_OK(record_batch);
                REQUIRE(record_batch->num_rows() == static_cast<std::size_t>(read_count));

                auto columns = record_batch->columns();

                // Every column must contain one entry per read in the batch.
                CHECK(columns->read_id->length() == read_count);
                CHECK(columns->signal->length() == read_count);
                CHECK(columns->channel->length() == read_count);
                CHECK(columns->well->length() == read_count);
                CHECK(columns->pore_type->length() == read_count);
                CHECK(columns->calibration_offset->length() == read_count);
                CHECK(columns->calibration_scale->length() == read_count);
                CHECK(columns->read_number->length() == read_count);
                CHECK(columns->start_sample->length() == read_count);
                CHECK(columns->median_before->length() == read_count);
                CHECK(columns->num_samples->length() == read_count);
                CHECK(columns->end_reason->length() == read_count);
                CHECK(columns->end_reason_forced->length() == read_count);
                CHECK(columns->run_info->length() == read_count);

                // Dictionary columns are compared through their raw index arrays.
                auto pore_indices =
                    std::static_pointer_cast<arrow::Int16Array>(columns->pore_type->indices());
                auto end_reason_indices =
                    std::static_pointer_cast<arrow::Int16Array>(columns->end_reason->indices());
                auto run_info_indices =
                    std::static_pointer_cast<arrow::Int16Array>(columns->run_info->indices());
                for (auto j = 0; j < read_count; ++j) {
                    // Regenerate the data that was written for this global row index.
                    auto idx = j + i * read_count;

                    pod5::ReadData read_data;
                    std::vector<std::uint64_t> expected_signal;
                    std::tie(read_data, expected_signal) = data_for_index(idx);

                    CHECK(columns->read_id->Value(j) == read_data.read_id);

                    auto signal_data = std::static_pointer_cast<arrow::UInt64Array>(
                        columns->signal->value_slice(j));
                    CHECK(
                        gsl::make_span(signal_data->raw_values(), signal_data->length())
                        == gsl::make_span(expected_signal));

                    CHECK(columns->read_number->Value(j) == read_data.read_number);
                    CHECK(columns->start_sample->Value(j) == read_data.start_sample);
                    CHECK(columns->median_before->Value(j) == read_data.median_before);
                    // The writer was given signal.size() as the sample count for each read.
                    CHECK(columns->num_samples->Value(j) == expected_signal.size());
                    CHECK(columns->calibration_offset->Value(j) == read_data.calibration_offset);
                    CHECK(columns->calibration_scale->Value(j) == read_data.calibration_scale);
                    CHECK(columns->channel->Value(j) == read_data.channel);
                    CHECK(columns->well->Value(j) == read_data.well);

                    CHECK(end_reason_indices->Value(j) == read_data.end_reason);
                    CHECK(pore_indices->Value(j) == read_data.pore_type);
                    CHECK(run_info_indices->Value(j) == read_data.run_info);
                }

                // Dictionary lookups: the entries registered during the writing phase must be
                // retrievable from every record batch.
                auto pore_data = record_batch->get_pore_type(0);
                REQUIRE_ARROW_STATUS_OK(pore_data);
                CHECK(*pore_data == "Well Type");

                auto end_reason_data = record_batch->get_end_reason(1);
                REQUIRE_ARROW_STATUS_OK(end_reason_data);
                CHECK(end_reason_data->first == pod5::ReadEndReason::mux_change);
                CHECK(end_reason_data->second == "mux_change");

                auto run_info_data = record_batch->get_run_info(0);
                REQUIRE_ARROW_STATUS_OK(run_info_data);
                CHECK(*run_info_data == "acq_id_1");

                run_info_data = record_batch->get_run_info(1);
                REQUIRE_ARROW_STATUS_OK(run_info_data);
                CHECK(*run_info_data == "acq_id_2");
            }
        }
    }
}


================================================
FILE: c++/test/read_table_writer_utils_tests.cpp
================================================
#include "pod5_format/read_table_writer_utils.h"

#include "test_utils.h"
#include "utils.h"

#include <arrow/array/array_binary.h>
#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/memory_pool.h>
#include <catch2/catch.hpp>

/// Checks that the run info dictionary writer hands out sequential indices for added
/// acquisition ids and that its value array reflects every entry added so far, including when
/// the value array is requested more than once.
TEST_CASE("Run Info Writer Tests")
{
    auto pool = arrow::system_memory_pool();
    auto run_info_writer = pod5::make_run_info_writer(pool);
    REQUIRE_ARROW_STATUS_OK(run_info_writer);

    auto index = (*run_info_writer)->add("acq_id_1");
    // Confirm the add succeeded before dereferencing its result, as the read table tests do.
    REQUIRE_ARROW_STATUS_OK(index);
    CHECK(*index == 0);
    CHECK((*run_info_writer)->item_count() == 1);

    // Important to always call this so we test calling it twice
    auto const value_array = (*run_info_writer)->get_value_array();

    WHEN("Checking the first row")
    {
        REQUIRE_ARROW_STATUS_OK(value_array);

        auto string_value_array = std::dynamic_pointer_cast<arrow::StringArray>(*value_array);
        REQUIRE(string_value_array);

        CHECK(string_value_array->length() == 1);
        CHECK(string_value_array->Value(0) == "acq_id_1");
    }

    index = (*run_info_writer)->add("acq_id_2");
    REQUIRE_ARROW_STATUS_OK(index);
    CHECK(*index == 1);
    CHECK((*run_info_writer)->item_count() == 2);

    WHEN("Checking the rows after a second append")
    {
        // Fetched afresh (and named distinctly from the earlier snapshot) so that it includes
        // the second entry.
        auto updated_value_array = (*run_info_writer)->get_value_array();
        REQUIRE_ARROW_STATUS_OK(updated_value_array);

        auto string_value_array =
            std::dynamic_pointer_cast<arrow::StringArray>(*updated_value_array);
        REQUIRE(string_value_array);

        CHECK(string_value_array->length() == 2);
        CHECK(string_value_array->Value(0) == "acq_id_1");
        CHECK(string_value_array->Value(1) == "acq_id_2");
    }
}


================================================
FILE: c++/test/run_info_table_tests.cpp
================================================
#include "pod5_format/internal/async_output_stream.h"
#include "pod5_format/run_info_table_reader.h"
#include "pod5_format/run_info_table_writer.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/types.h"
#include "pod5_format/uuid.h"
#include "pod5_format/version.h"
#include "test_utils.h"
#include "utils.h"

#include <arrow/array/array_dict.h>
#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/io/file.h>
#include <arrow/memory_pool.h>
#include <arrow/record_batch.h>
#include <catch2/catch.hpp>

// Round-trips two RunInfoData rows through a run info table written to "./foo.pod5" and checks
// that the schema metadata, every typed column and find_run_info() return what was written.
SCENARIO("Run Info table Tests")
{
    using namespace pod5;

    // Extension types are registered for the duration of the test and unregistered on exit.
    (void)pod5::register_extension_types();
    auto fin = gsl::finally([] { (void)pod5::unregister_extension_types(); });

    std::mt19937 gen{Catch::rngSeed()};
    auto uuid_gen = pod5::UuidRandomGenerator{gen};

    auto file_identifier = uuid_gen();

    GIVEN("A run info table writer")
    {
        auto filename = "./foo.pod5";
        auto pool = arrow::system_memory_pool();

        auto run_info_data_0 = get_test_run_info_data();
        auto run_info_data_1 = get_test_run_info_data("_2");

        // Writer scope: everything written here goes out of scope before the file is re-opened.
        {
            auto file_out =
                *pod5::AsyncOutputStream::make(filename, pod5::make_thread_pool(1), true);
            auto schema_metadata = make_schema_key_value_metadata(
                {file_identifier, "test_software", *parse_version_number(Pod5Version)});
            REQUIRE_ARROW_STATUS_OK(schema_metadata);

            std::size_t run_info_per_batch = 2;

            auto writer = pod5::make_run_info_table_writer(
                file_out, *schema_metadata, run_info_per_batch, pool);
            REQUIRE_ARROW_STATUS_OK(writer);

            REQUIRE_ARROW_STATUS_OK(writer->add_run_info(run_info_data_0));
            REQUIRE_ARROW_STATUS_OK(writer->add_run_info(run_info_data_1));
        }

        auto file_in = arrow::io::ReadableFile::Open(filename, pool);
        {
            REQUIRE_ARROW_STATUS_OK(file_in);

            auto reader = pod5::make_run_info_table_reader(*file_in, pool);
            REQUIRE_ARROW_STATUS_OK(reader);

            auto metadata = reader->schema_metadata();
            CHECK(metadata.file_identifier == file_identifier);
            CHECK(metadata.writing_software == "test_software");
            CHECK(metadata.writing_pod5_version == *parse_version_number(Pod5Version));

            // Both rows are expected in a single record batch.
            REQUIRE(reader->num_record_batches() == 1);
            auto const record_batch = reader->read_record_batch(0);
            REQUIRE_ARROW_STATUS_OK(record_batch);
            REQUIRE(record_batch->num_rows() == 2);

            auto columns = record_batch->columns();
            REQUIRE_ARROW_STATUS_OK(columns);

            // Compares the scalar columns of row `index` against the RunInfoData that was written.
            auto check_run_info = [](auto & columns,
                                     std::size_t index,
                                     pod5::RunInfoData const & run_info_data) {
                CHECK(columns.acquisition_id->Value(index) == run_info_data.acquisition_id);

                CHECK(
                    columns.acquisition_start_time->Value(index)
                    == run_info_data.acquisition_start_time);
                CHECK(columns.adc_max->Value(index) == run_info_data.adc_max);
                CHECK(columns.adc_min->Value(index) == run_info_data.adc_min);
                CHECK(columns.experiment_name->Value(index) == run_info_data.experiment_name);
                CHECK(columns.flow_cell_id->Value(index) == run_info_data.flow_cell_id);
                CHECK(
                    columns.flow_cell_product_code->Value(index)
                    == run_info_data.flow_cell_product_code);
                CHECK(columns.protocol_name->Value(index) == run_info_data.protocol_name);
                CHECK(columns.protocol_run_id->Value(index) == run_info_data.protocol_run_id);
                CHECK(
                    columns.protocol_start_time->Value(index) == run_info_data.protocol_start_time);
                CHECK(columns.sample_id->Value(index) == run_info_data.sample_id);
                CHECK(columns.sample_rate->Value(index) == run_info_data.sample_rate);
                CHECK(columns.sequencing_kit->Value(index) == run_info_data.sequencing_kit);
                CHECK(columns.sequencer_position->Value(index) == run_info_data.sequencer_position);
                CHECK(
                    columns.sequencer_position_type->Value(index)
                    == run_info_data.sequencer_position_type);
                CHECK(columns.software->Value(index) == run_info_data.software);
                CHECK(columns.system_name->Value(index) == run_info_data.system_name);
                CHECK(columns.system_type->Value(index) == run_info_data.system_type);
            };

            check_run_info(*columns, 0, run_info_data_0);
            check_run_info(*columns, 1, run_info_data_1);

            // The lookups are dereferenced twice below, so a failed or empty lookup must stop
            // the test (REQUIRE) rather than be recorded and then dereferenced (CHECK).
            auto found_run_info_0 = reader->find_run_info(run_info_data_0.acquisition_id);
            REQUIRE_ARROW_STATUS_OK(found_run_info_0);
            REQUIRE(*found_run_info_0);
            CHECK(**found_run_info_0 == run_info_data_0);

            auto found_run_info_1 = reader->find_run_info(run_info_data_1.acquisition_id);
            REQUIRE_ARROW_STATUS_OK(found_run_info_1);
            REQUIRE(*found_run_info_1);
            CHECK(**found_run_info_1 == run_info_data_1);
        }
    }
}


================================================
FILE: c++/test/schema_tests.cpp
================================================
#include "pod5_format/schema_metadata.h"
#include "test_utils.h"

#include <catch2/catch.hpp>

// Exercises Version ordering/equality operators, parse_version_number() and to_string().
SCENARIO("Version Tests")
{
    using namespace pod5;

    // Reference value that most comparisons are made against.
    auto const base = Version(1, 2, 3);

    // Strictly-less: a difference in any one component is enough.
    CHECK(base < Version(3, 2, 1));
    CHECK(base < Version(1, 3, 3));
    CHECK(base < Version(1, 2, 4));

    // Strictly-greater: the mirror image of the cases above.
    CHECK(Version(3, 2, 1) > base);
    CHECK(Version(1, 3, 3) > base);
    CHECK(Version(1, 2, 4) > base);

    // Equality and inequality.
    CHECK(base == Version(1, 2, 3));

    CHECK(base != Version(2, 2, 3));
    CHECK(base != Version(1, 3, 3));
    CHECK(base != Version(1, 2, 4));

    // Strings with a fourth component or a textual suffix are rejected.
    CHECK_ARROW_STATUS_NOT_OK(parse_version_number("1.2.3.4"));
    CHECK_ARROW_STATUS_NOT_OK(parse_version_number("1.2.3-pre"));

    // A well-formed string parses into its three numeric components.
    auto const from_text = parse_version_number("10.200.3");
    REQUIRE_ARROW_STATUS_OK(from_text);
    CHECK(Version(10, 200, 3) == *from_text);
    CHECK(from_text->major_version() == 10);
    CHECK(from_text->minor_version() == 200);
    CHECK(from_text->revision_version() == 3);

    // Formatting back to text uses dot-separated components.
    CHECK(Version(1, 200, 30).to_string() == "1.200.30");
}


================================================
FILE: c++/test/signal_compression_tests.cpp
================================================
#include "pod5_format/signal_compression.h"

#include "test_utils.h"
#include "utils.h"

#include <arrow/buffer.h>
#include <arrow/memory_pool.h>
#include <catch2/catch.hpp>
#include <gsl/gsl-lite.hpp>

#include <numeric>

// Compresses a ramp of int16 samples, decompresses it again and checks the round trip is lossless.
SCENARIO("Signal compression Tests")
{
    auto pool = arrow::system_memory_pool();

    // 10'000 samples holding 0, 1, 2, ... (every value fits in an int16_t).
    // The digit separator is now grouped in thousands; the count itself is unchanged.
    std::vector<std::int16_t> signal(10'000);
    std::iota(signal.begin(), signal.end(), 0);

    auto compressed = pod5::compress_signal(gsl::make_span(signal), pool);
    REQUIRE_ARROW_STATUS_OK(compressed);
    auto compressed_span = gsl::make_span((*compressed)->data(), (*compressed)->size());

    // Decompression is told how many samples to expect.
    auto decompressed = pod5::decompress_signal(compressed_span, signal.size(), pool);
    REQUIRE_ARROW_STATUS_OK(decompressed);
    // View the decompressed byte buffer as int16 samples for the comparison.
    auto decompressed_span = gsl::make_span((*decompressed)->data(), (*decompressed)->size())
                                 .as_span<std::int16_t const>();

    CHECK(gsl::make_span(signal) == decompressed_span);
}


================================================
FILE: c++/test/signal_table_tests.cpp
================================================
#include "pod5_format/internal/async_output_stream.h"
#include "pod5_format/schema_metadata.h"
#include "pod5_format/signal_compression.h"
#include "pod5_format/signal_table_reader.h"
#include "pod5_format/signal_table_writer.h"
#include "pod5_format/types.h"
#include "pod5_format/uuid.h"
#include "pod5_format/version.h"
#include "test_utils.h"
#include "utils.h"

#include <arrow/array/array_nested.h>
#include <arrow/array/array_primitive.h>
#include <arrow/io/file.h>
#include <arrow/memory_pool.h>
#include <arrow/record_batch.h>
#include <catch2/catch.hpp>

#include <numeric>

// Writes two reads' signal into a signal table on disk (once per signal storage type), then
// re-opens the file and checks metadata, read ids, stored signal and sample counts.
SCENARIO("Signal table Tests")
{
    using namespace pod5;

    // Extension types are registered for the duration of the test and unregistered on exit.
    (void)pod5::register_extension_types();
    auto fin = gsl::finally([] { (void)pod5::unregister_extension_types(); });

    std::mt19937 gen{Catch::rngSeed()};
    auto uuid_gen = pod5::UuidRandomGenerator{gen};

    auto file_identifier = uuid_gen();

    auto read_id_1 = uuid_gen();
    auto read_id_2 = uuid_gen();
    // signal_1: 100'000 samples filled from an int counter starting at 0; each value is
    // converted to int16_t on assignment, so counts beyond the int16_t range are narrowed.
    std::vector<std::int16_t> signal_1(100'000);
    std::iota(signal_1.begin(), signal_1.end(), 0);
    // signal_2: 10'000 samples, all equal to 1.
    std::vector<std::int16_t> signal_2(10'000, 1);

    GIVEN("A signal table writer")
    {
        auto filename = "./foo.pod5";
        auto pool = arrow::system_memory_pool();

        // The whole GIVEN body runs once for each listed signal type.
        auto signal_type = GENERATE(SignalType::UncompressedSignal, SignalType::VbzSignal);

        // Writer scope: the output stream and writer go out of scope before the file is read.
        {
            auto file_out =
                *pod5::AsyncOutputStream::make(filename, pod5::make_thread_pool(1), true);
            auto schema_metadata = make_schema_key_value_metadata(
                {file_identifier, "test_software", *parse_version_number(Pod5Version)});
            REQUIRE_ARROW_STATUS_OK(schema_metadata);

            // NOTE(review): the literal 100 is presumably the table batch size — confirm against
            // make_signal_table_writer's signature.
            auto writer =
                pod5::make_signal_table_writer(file_out, *schema_metadata, 100, signal_type, pool);
            REQUIRE_ARROW_STATUS_OK(writer);

            WHEN("Writing a read")
            {
                auto row_1 = writer->add_signal(read_id_1, gsl::make_span(signal_1));

                auto row_2 = writer->add_signal(read_id_2, gsl::make_span(signal_2));

                REQUIRE_ARROW_STATUS_OK(writer->close());

                THEN("Read row ids are correct")
                {
                    // Rows are numbered in the order the signals were added.
                    REQUIRE_ARROW_STATUS_OK(row_1);
                    REQUIRE_ARROW_STATUS_OK(row_2);
                    CHECK(*row_1 == 0);
                    CHECK(*row_2 == 1);
                }
            }
        }

        auto file_in = arrow::io::ReadableFile::Open(filename, pool);
        {
            REQUIRE_ARROW_STATUS_OK(file_in);

            // NOTE(review): the meaning of the literal 20 is not visible here — confirm against
            // make_signal_table_reader's signature.
            auto reader = pod5::make_signal_table_reader(*file_in, 20, pool);
            CAPTURE(reader);
            REQUIRE_ARROW_STATUS_OK(reader);

            auto metadata = reader->schema_metadata();
            CHECK(metadata.file_identifier == file_identifier);
            CHECK(metadata.writing_software == "test_software");
            CHECK(metadata.writing_pod5_version == *parse_version_number(Pod5Version));

            // Both reads are expected as two rows of a single record batch.
            REQUIRE(reader->num_record_batches() == 1);
            auto const record_batch_0 = reader->read_record_batch(0);
            REQUIRE_ARROW_STATUS_OK(record_batch_0);
            REQUIRE(record_batch_0->num_rows() == 2);

            auto read_id = record_batch_0->read_id_column();
            CHECK(read_id->length() == 2);
            CHECK(read_id->Value(0) == read_id_1);
            CHECK(read_id->Value(1) == read_id_2);

            // The signal column accessor depends on which storage type was written.
            if (signal_type == SignalType::VbzSignal) {
                auto signal = record_batch_0->vbz_signal_column();
                CHECK(signal->length() == 2);

                // Decompresses one stored row and compares it with the samples that were written.
                auto compare_compressed_signal =
                    [&](gsl::span<std::uint8_t const> compressed_actual,
                        std::vector<std::int16_t> const & expected) {
                        auto decompressed =
                            pod5::decompress_signal(compressed_actual, expected.size(), pool);
                        REQUIRE_ARROW_STATUS_OK(decompressed);

                        auto actual =
                            gsl::make_span((*decompressed)->data(), (*decompressed)->size())
                                .as_span<std::int16_t const>();
                        CHECK(actual == gsl::make_span(expected));
                    };

                auto signal_typed = std::static_pointer_cast<VbzSignalArray>(signal);
                compare_compressed_signal(signal_typed->Value(0), signal_1);
                compare_compressed_signal(signal_typed->Value(1), signal_2);
            } else if (signal_type == SignalType::UncompressedSignal) {
                auto signal = record_batch_0->uncompressed_signal_column();
                CHECK(signal->length() == 2);

                // Each row is a slice of int16 values; copy it out to compare with the input.
                auto signal_1_read =
                    std::static_pointer_cast<arrow::Int16Array>(signal->value_slice(0));
                std::vector<std::int16_t> stored_values_1(
                    signal_1_read->raw_values(),
                    signal_1_read->raw_values() + signal_1_read->length());
                CHECK(stored_values_1 == signal_1);
                auto signal_2_read =
                    std::static_pointer_cast<arrow::Int16Array>(signal->value_slice(1));
                std::vector<std::int16_t> stored_values_2(
                    signal_2_read->raw_values(),
                    signal_2_read->raw_values() + signal_2_read->length());
                CHECK(stored_values_2 == signal_2);
            } else {
                FAIL("Unknown signal type");
            }

            // The samples column records how many samples each row holds.
            auto samples = record_batch_0->samples_column();
            CHECK(samples->length() == 2);
            CHECK(samples->Value(0) == signal_1.size());
            CHECK(samples->Value(1) == signal_2.size());
        }
    }
}


================================================
FILE: c++/test/svb16_scalar_tests.cpp
================================================
#include "pod5_format/svb16/decode.hpp"
#include "pod5_format/svb16/encode.hpp"

#include <catch2/catch.hpp>

#include <algorithm>
#include <cstdint>
#include <limits>
#include <random>
#include <vector>

using Catch::Matchers::Equals;

// Encodes 1024 pseudo-random values with the scalar encoder, decodes them with the scalar
// decoder and checks that the decoder consumed exactly the encoded bytes and reproduced the input.
template <typename Int16T, bool UseDelta, bool UseZigzag>
void test_scalar_encode_scalar_decode()
{
    constexpr uint32_t value_count = 1024;

    // Default-seeded engine: the same sequence is produced on every run.
    std::minstd_rand engine;
    std::uniform_int_distribution<Int16T> full_range{
        std::numeric_limits<Int16T>::min(), std::numeric_limits<Int16T>::max()};

    std::vector<Int16T> input(value_count);
    for (auto & value : input) {
        value = full_range(engine);
    }

    // The encoded buffer holds the key bytes first, followed by the data bytes.
    auto const key_bytes = svb16_key_length(input.size());
    std::vector<uint8_t> packed(svb16_max_encoded_length(input.size()));

    auto const encode_end = svb16::encode_scalar<Int16T, UseDelta, UseZigzag>(
        input.data(), packed.data(), packed.data() + key_bytes, value_count);
    auto const encoded_count = encode_end - packed.data();

    CHECK(encoded_count <= svb16_max_encoded_length(input.size()));

    std::vector<Int16T> output(value_count);
    auto const packed_span = gsl::make_span(packed);
    auto const decode_end = svb16::decode_scalar<Int16T, UseDelta, UseZigzag>(
        gsl::make_span(output), packed_span.subspan(0, key_bytes), packed_span.subspan(key_bytes));
    auto const consumed = decode_end - packed.data();

    CHECK(consumed == encoded_count);

    CHECK_THAT(output, Equals(input));
}

// Runs the scalar round-trip helper for every combination of signedness, delta and zig-zag.
TEST_CASE("Scalar decode is inverse of scalar encode", "[scalar]")
{
    // Plain encoding.
    SECTION("Unsigned, no delta, no zig-zag") { test_scalar_encode_scalar_decode<uint16_t, false, false>(); }
    SECTION("Signed, no delta, no zig-zag") { test_scalar_encode_scalar_decode<int16_t, false, false>(); }

    // Delta only.
    SECTION("Unsigned, delta, no zig-zag") { test_scalar_encode_scalar_decode<uint16_t, true, false>(); }
    SECTION("Signed, delta, no zig-zag") { test_scalar_encode_scalar_decode<int16_t, true, false>(); }

    // Delta combined with zig-zag.
    SECTION("Unsigned, delta, zig-zag") { test_scalar_encode_scalar_decode<uint16_t, true, true>(); }
    SECTION("Signed, delta, zig-zag") { test_scalar_encode_scalar_decode<int16_t, true, true>(); }

    // Zig-zag only. For unsigned input this combination is not really meaningful, but it is
    // possible, so it is covered as well.
    SECTION("Unsigned, no delta, zig-zag") { test_scalar_encode_scalar_decode<uint16_t, false, true>(); }
    SECTION("Signed, no delta, zig-zag") { test_scalar_encode_scalar_decode<int16_t, false, true>(); }
}


================================================
FILE: c++/test/svb16_x64_tests.cpp
================================================
#include "pod5_format/svb16/decode.hpp"
#include "pod5_format/svb16/encode.hpp"

#include <catch2/catch.hpp>

#include <algorithm>
#include <cstdint>
#include <limits>
#include <numeric>
#include <random>
#include <vector>

#ifdef SVB16_X64

using Catch::Matchers::Equals;

// Encodes pseudo-random values with the SSE encoder, checks the bytes match the scalar encoder's
// output, then decodes with the SSE decoder and checks the original values come back.
template <typename Int16T, bool UseDelta, bool UseZigzag>
void test_sse_encode_scalar_decode()
{
    // Deliberately not aligned to 64 so we test the scalar tidy up code at the end.
    uint32_t const DATA_COUNT = GENERATE(1000, 20000);

    // Default-seeded engine: the same sequence is produced on every run.
    std::minstd_rand engine;
    std::uniform_int_distribution<Int16T> full_range{
        std::numeric_limits<Int16T>::min(), std::numeric_limits<Int16T>::max()};

    std::vector<Int16T> input(DATA_COUNT);
    for (auto & value : input) {
        value = full_range(engine);
    }

    // Both encoded buffers hold the key bytes first, followed by the data bytes.
    auto const key_bytes = svb16_key_length(input.size());

    std::vector<uint8_t> packed_sse(svb16_max_encoded_length(input.size()));
    auto const sse_end = svb16::encode_sse<Int16T, UseDelta, UseZigzag>(
        input.data(), packed_sse.data(), packed_sse.data() + key_bytes, DATA_COUNT);
    auto const encoded_count = sse_end - packed_sse.data();

    CHECK(encoded_count <= svb16_max_encoded_length(input.size()));

    // Reference encoding produced by the scalar implementation.
    std::vector<uint8_t> packed_scalar(svb16_max_encoded_length(input.size()));
    auto const scalar_end = svb16::encode_scalar<Int16T, UseDelta, UseZigzag>(
        input.data(), packed_scalar.data(), packed_scalar.data() + key_bytes, DATA_COUNT);
    auto const scalar_encoded_count = scalar_end - packed_scalar.data();

    CHECK(scalar_encoded_count == encoded_count);
    CHECK(packed_sse == packed_scalar);

    std::vector<Int16T> output(DATA_COUNT);
    auto const packed_span = gsl::make_span(packed_sse);
    auto const decode_end = svb16::decode_sse<Int16T, UseDelta, UseZigzag>(
        gsl::make_span(output), packed_span.subspan(0, key_bytes), packed_span.subspan(key_bytes));
    auto const consumed = decode_end - packed_sse.data();

    CHECK(consumed == encoded_count);

    CHECK_THAT(output, Equals(input));
}

// Runs the SSE round-trip helper for every combination of signedness, delta and zig-zag.
TEST_CASE("SSE decode is inverse of scalar encode", "[scalar]")
{
    // Plain encoding.
    SECTION("Unsigned, no delta, no zig-zag") { test_sse_encode_scalar_decode<uint16_t, false, false>(); }
    SECTION("Signed, no delta, no zig-zag") { test_sse_encode_scalar_decode<int16_t, false, false>(); }

    // Delta only.
    SECTION("Unsigned, delta, no zig-zag") { test_sse_encode_scalar_decode<uint16_t, true, false>(); }
    SECTION("Signed, delta, no zig-zag") { test_sse_encode_scalar_decode<int16_t, true, false>(); }

    // Delta combined with zig-zag.
    SECTION("Unsigned, delta, zig-zag") { test_sse_encode_scalar_decode<uint16_t, true, true>(); }
    SECTION("Signed, delta, zig-zag") { test_sse_encode_scalar_decode<int16_t, true, true>(); }

    // Zig-zag only. For unsigned input this combination is not really meaningful, but it is
    // possible, so it is covered as well.
    SECTION("Unsigned, no delta, zig-zag") { test_sse_encode_scalar_decode<uint16_t, false, true>(); }
    SECTION("Signed, no delta, zig-zag") { test_sse_encode_scalar_decode<int16_t, false, true>(); }
}

#endif


================================================
FILE: c++/test/test_utils.h
================================================
#pragma once

#include <arrow/result.h>
#include <arrow/status.h>
#include <catch2/catch.hpp>

// Lets Catch2 print an arrow::Result<T> in assertion output by rendering its status text.
template <typename T>
struct Catch::StringMaker<arrow::Result<T>> {
    static std::string convert(arrow::Result<T> const & result)
    {
        return result.status().ToString();
    }
};

// Catch2 matcher over arrow::Status. With CheckOk == true it matches OK statuses; with
// CheckOk == false it matches statuses that are not OK.
template <bool CheckOk>
class IsStatusOk : public Catch::MatcherBase<arrow::Status> {
public:
    IsStatusOk() = default;

    // Matches when the status' ok() flag equals the CheckOk template argument.
    bool match(arrow::Status const & status) const override { return status.ok() == CheckOk; }

    // Description shown by Catch2 next to the tested value. It follows the polarity of the
    // matcher, so a failing NOT_OK assertion no longer claims that OK was expected.
    std::string describe() const override
    {
        return CheckOk ? "== arrow::Status::OK()" : "!= arrow::Status::OK()";
    }
};

// Catch2 matcher over arrow::Result<T>. With CheckOk == true it matches results that hold a
// value; with CheckOk == false it matches results that hold an error.
template <bool CheckOk, typename T>
class IsResultOk : public Catch::MatcherBase<arrow::Result<T>> {
public:
    IsResultOk() = default;

    // Matches when the result's ok() flag equals the CheckOk template argument.
    bool match(arrow::Result<T> const & status) const override { return status.ok() == CheckOk; }

    // Description shown by Catch2 next to the tested value. It follows the polarity of the
    // matcher, so a failing NOT_OK assertion no longer claims that OK was expected.
    std::string describe() const override
    {
        return CheckOk ? "== arrow::Status::OK()" : "!= arrow::Status::OK()";
    }
};

// Overload set that picks the "is OK" matcher for the argument's type. The argument is used
// only for type deduction; its value is never read.
template <typename T>
inline IsResultOk<true, T> _is_arrow_ok(arrow::Result<T> const &)
{
    return {};
}

inline IsStatusOk<true> _is_arrow_ok(arrow::Status const &)
{
    return {};
}

// Overload set that picks the "is not OK" matcher for the argument's type. The argument is
// used only for type deduction; its value is never read.
template <typename T>
inline IsResultOk<false, T> _is_arrow_not_ok(arrow::Result<T> const &)
{
    return {};
}

inline IsStatusOk<false> _is_arrow_not_ok(arrow::Status const &)
{
    return {};
}

// Assertion macros for arrow::Status / arrow::Result<T> expressions. Each one evaluates
// `statement` exactly once, binds the outcome to a local reference and hands it to the matching
// Catch2 matcher. The CHECK_ variants use CHECK_THAT and the REQUIRE_ variants use REQUIRE_THAT.

// Non-fatal assertion that `statement` is OK.
#define CHECK_ARROW_STATUS_OK(statement)      \
    do {                                      \
        auto const & _res = (statement);      \
        CHECK_THAT(_res, _is_arrow_ok(_res)); \
    } while (false)

// Fatal assertion that `statement` is OK.
#define REQUIRE_ARROW_STATUS_OK(statement)      \
    do {                                        \
        auto const & _res = (statement);        \
        REQUIRE_THAT(_res, _is_arrow_ok(_res)); \
    } while (false)

// Non-fatal assertion that `statement` is not OK.
#define CHECK_ARROW_STATUS_NOT_OK(statement)      \
    do {                                          \
        auto const & _res = (statement);          \
        CHECK_THAT(_res, _is_arrow_not_ok(_res)); \
    } while (false)

// Fatal assertion that `statement` is not OK.
#define REQUIRE_ARROW_STATUS_NOT_OK(statement)      \
    do {                                            \
        auto const & _res = (statement);            \
        REQUIRE_THAT(_res, _is_arrow_not_ok(_res)); \
    } while (false)


================================================
FILE: c++/test/thread_pool_tests.cpp
================================================
#include "pod5_format/thread_pool.h"

#include <catch2/catch.hpp>

#include <condition_variable>
#include <mutex>
#include <thread>
#include <vector>

// Posts two tasks that can only finish if both are running at the same time: each task waits at
// two rendezvous points until the other task has arrived as well. Runs for every combination of
// explicit/implicit shutdown and strand/pool posting.
TEST_CASE("Thread pool runs tasks concurrently", "[thread_pool]")
{
    using namespace std::chrono_literals;

    auto const explicit_stop = GENERATE(true, false);
    CAPTURE(explicit_stop);

    auto const use_strands = GENERATE(true, false);
    CAPTURE(use_strands);

    // semaphores only in std lib in c++20, so fake them
    // Each counter starts at the number of tasks and is decremented once per task; a single
    // mutex guards both counters.
    std::mutex sem_mutex;
    int sem1 = 2;
    std::condition_variable cv1;
    int sem2 = 2;
    std::condition_variable cv2;

    // Builds the task body. All state is captured by reference, so both tasks share it.
    auto const create_task = [&]() -> std::function<void()> {
        return [&] {
            std::unique_lock<std::mutex> l{sem_mutex};
            // First rendezvous: the first task to arrive waits, the last one wakes it.
            sem1--;
            if (sem1 > 0) {
                cv1.wait(l, [&] { return sem1 == 0; });
            } else {
                // Notify without holding the lock, pause briefly, then re-acquire the lock
                // for the second rendezvous.
                l.unlock();
                cv1.notify_all();
                std::this_thread::sleep_for(1ms);
                l.lock();
            }

            // Second rendezvous, same scheme as the first.
            sem2--;
            if (sem2 > 0) {
                cv2.wait(l, [&] { return sem2 == 0; });
            } else {
                l.unlock();
                cv2.notify_all();
            }
        };
    };

    auto thread_pool = pod5::make_thread_pool(2);
    std::shared_ptr<pod5::ThreadPoolStrand> strands[2];
    if (use_strands) {
        // One task per strand, so the two tasks are on different strands.
        for (unsigned i = 0; i < 2; ++i) {
            strands[i] = thread_pool->create_strand();
            strands[i]->post(create_task());
        }
    } else {
        thread_pool->post(create_task());
        thread_pool->post(create_task());
    }

    if (explicit_stop) {
        thread_pool->stop_and_drain();
    } else {
        // Implicit shutdown: drop the test's references to the pool and to any strands.
        // NOTE(review): presumably releasing the last reference waits for queued tasks —
        // confirm against the thread pool implementation.
        thread_pool.reset();
        for (unsigned i = 0; i < 2; ++i) {
            strands[i].reset();
        }
    }

    // Both tasks must have passed both rendezvous points.
    REQUIRE(sem1 == 0);
    REQUIRE(sem2 == 0);
}

// Posts two tasks to one strand of a two-thread pool. Each task logs its id, sleeps, and logs
// its id again; the two entries of a task must be adjacent in the log if the strand ran the
// tasks one after the other.
TEST_CASE("Tasks on the same strand are serialised", "[thread_pool]")
{
    using namespace std::chrono_literals;

    auto const explicit_stop = GENERATE(true, false);
    CAPTURE(explicit_stop);

    std::mutex order_mutex;
    std::vector<int> order;
    order.reserve(4);

    // Appends `id` to the shared log while holding the lock.
    auto const record = [&](int const id) {
        std::lock_guard<std::mutex> guard{order_mutex};
        order.push_back(id);
    };

    // Builds a task that logs its id on entry and again after a 50ms pause.
    auto const make_task = [&](int const id) -> std::function<void()> {
        return [&, id] {
            record(id);
            std::this_thread::sleep_for(50ms);
            record(id);
        };
    };

    auto thread_pool = pod5::make_thread_pool(2);
    auto strand = thread_pool->create_strand();
    strand->post(make_task(0));
    strand->post(make_task(1));

    if (explicit_stop) {
        thread_pool->stop_and_drain();
    } else {
        thread_pool.reset();
        strand.reset();
    }

    REQUIRE(order.size() == 4);

    // Either task may run first, but the entries of one task must never interleave with the other.
    auto const expected =
        (order[0] == 0) ? std::vector<int>{0, 0, 1, 1} : std::vector<int>{1, 1, 0, 0};
    REQUIRE(order == expected);
}


================================================
FILE: c++/test/utils.h
================================================
#pragma once

#include "pod5_format/read_table_utils.h"
#include "test_utils.h"

#include <arrow/result.h>
#include <arrow/util/io_util.h>

// Builds a RunInfoData fixture for tests.
//
// suffix            - appended to every string field, so fixtures built with different suffixes
//                     differ from each other.
// adc_center_offset - added to the 4095 / -4096 ADC bounds.
// sample_rate       - passed through unchanged.
inline pod5::RunInfoData get_test_run_info_data(
    std::string suffix = "",
    std::int16_t adc_center_offset = 0,
    std::int16_t sample_rate = 4000)
{
    // Produces "<base><suffix>" for a string field.
    auto const named = [&suffix](char const * base) { return base + suffix; };

    return pod5::RunInfoData(
        named("acquisition_id"),
        1005,
        4095 + adc_center_offset,
        -4096 + adc_center_offset,
        {{named("context"), named("tags")},
         {named("other"), named("tagz")},
         {named("third"), named("thing")}},
        named("experiment_name"),
        named("flow_cell_id"),
        named("flow_cell_product_code"),
        named("protocol_name"),
        named("protocol_run_id"),
        200005,
        named("sample_id"),
        sample_rate,
        named("sequencing_kit"),
        named("sequencer_position"),
        named("sequencer_position_type"),
        named("software"),
        named("system_name"),
        named("system_type"),
        {{named("tracking"), named("id")}});
}

// Deletes `file` when it exists. Returns OK when the file was absent or was deleted, and
// forwards the error status of whichever step failed otherwise.
inline arrow::Status remove_file_if_exists(std::string const & file)
{
    ARROW_ASSIGN_OR_RAISE(
        auto platform_path, ::arrow::internal::PlatformFilename::FromString(file));
    ARROW_ASSIGN_OR_RAISE(bool already_there, arrow::internal::FileExists(platform_path));

    // Nothing to remove.
    if (!already_there) {
        return arrow::Status::OK();
    }

    ARROW_RETURN_NOT_OK(arrow::internal::DeleteFile(platform_path));
    return arrow::Status::OK();
}


================================================
FILE: c++/test/uuid_tests.cpp
================================================
// This file contains code from https://github.com/mariusbancila/stduuid/ which has the following
// license:
//
//   MIT License
//
//   Copyright (c) 2017
//
//   Permission is hereby granted, free of charge, to any person obtaining a copy
//   of this software and associated documentation files (the "Software"), to deal
//   in the Software without restriction, including without limitation the rights
//   to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
//   copies of the Software, and to permit persons to whom the Software is
//   furnished to do so, subject to the following conditions:
//
//   The above copyright notice and this permission notice shall be included in all
//   copies or substantial portions of the Software.
//
//   THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
//   IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
//   FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
//   AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
//   LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
//   OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
//   SOFTWARE.

#include "pod5_format/uuid.h"

#include <catch2/catch.hpp>

#include <set>
#include <unordered_set>

// A default-constructed Uuid reports itself as nil.
TEST_CASE("Default constructor returns nil UUID", "[pod5::Uuid]")
{
    pod5::Uuid const default_constructed;
    REQUIRE(default_constructed.is_nil());
}

// A default-constructed Uuid formats as all zeros, for both char and wchar_t output.
TEST_CASE("Default constructor produces all-zero string", "[pod5::Uuid]")
{
    pod5::Uuid const nil_uuid;

    auto const narrow_text = to_string(nil_uuid);
    auto const wide_text = pod5::to_string<wchar_t>(nil_uuid);

    REQUIRE(narrow_text == "00000000-0000-0000-0000-000000000000");
    REQUIRE(wide_text == L"00000000-0000-0000-0000-000000000000");
}

// Parsing the all-zero string succeeds and yields a nil Uuid, with or without braces and for
// both char and wchar_t input.
TEST_CASE("Parsing the nil UUID is nil", "[pod5::Uuid]")
{
    // Requires that a parse succeeded and that the parsed value is nil.
    auto const require_parsed_nil = [](auto const & parsed) {
        REQUIRE(parsed);
        REQUIRE(parsed->is_nil());
    };

    auto const no_braces = pod5::Uuid::from_string("00000000-0000-0000-0000-000000000000");
    auto const braces = pod5::Uuid::from_string("{00000000-0000-0000-0000-000000000000}");
    auto const no_braces_w = pod5::Uuid::from_string(L"00000000-0000-0000-0000-000000000000");
    auto const braces_w = pod5::Uuid::from_string(L"{00000000-0000-0000-0000-000000000000}");

    require_parsed_nil(no_braces);
    require_parsed_nil(braces);
    require_parsed_nil(no_braces_w);
    require_parsed_nil(braces_w);
}

// The braced and unbraced spellings of one UUID parse to the same value, for both char and
// wchar_t input.
TEST_CASE("Parsing produces the same value with or without braces", "[pod5::Uuid]")
{
    auto const no_braces = pod5::Uuid::from_string("1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7");
    auto const braces = pod5::Uuid::from_string("{1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7}");
    auto const no_braces_w = pod5::Uuid::from_string(L"1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7");
    auto const braces_w = pod5::Uuid::from_string(L"{1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7}");

    // Require every parse to succeed first; otherwise two failed parses could compare equal
    // and the equality checks below would pass without testing anything.
    REQUIRE(no_braces);
    REQUIRE(braces);
    REQUIRE(no_braces_w);
    REQUIRE(braces_w);

    REQUIRE(no_braces == braces);
    REQUIRE(no_braces_w == braces_w);
}

// The char and wchar_t spellings of one UUID parse to the same value, with and without braces.
TEST_CASE("Parsing produces the same value from char or wchar_t", "[pod5::Uuid]")
{
    auto const no_braces = pod5::Uuid::from_string("1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7");
    auto const braces = pod5::Uuid::from_string("{1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7}");
    auto const no_braces_w = pod5::Uuid::from_string(L"1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7");
    auto const braces_w = pod5::Uuid::from_string(L"{1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7}");

    // Require every parse to succeed first; otherwise two failed parses could compare equal
    // and the equality checks below would pass without testing anything.
    REQUIRE(no_braces);
    REQUIRE(braces);
    REQUIRE(no_braces_w);
    REQUIRE(braces_w);

    REQUIRE(no_braces == no_braces_w);
    REQUIRE(braces == braces_w);
}

// Formatting a parsed Uuid gives back the text it was parsed from, as char and as wchar_t.
TEST_CASE("A parsed UUID prints the same value", "[pod5::Uuid]")
{
    auto const parsed = pod5::Uuid::from_string("1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7");
    REQUIRE(parsed);

    auto const narrow_text = to_string(*parsed);
    auto const wide_text = pod5::to_string<wchar_t>(*parsed);

    REQUIRE(narrow_text == "1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7");
    REQUIRE(wide_text == L"1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7");
}

// Malformed inputs must not parse.
TEST_CASE("Invalid UUIDs cannot be parsed", "[pod5::Uuid]")
{
    // True when parsing `text` fails. The argument is forwarded by reference so the literal
    // keeps its original type.
    auto const is_rejected = [](auto const & text) { return !pod5::Uuid::from_string(text); };

    // Empty input, with and without braces.
    REQUIRE(is_rejected(""));
    REQUIRE(is_rejected("{}"));

    // Mismatched braces.
    REQUIRE(is_rejected("{1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7"));
    REQUIRE(is_rejected("1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c7}"));

    // One character short.
    REQUIRE(is_rejected("1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c"));

    // One character too many.
    REQUIRE(is_rejected("1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96c77"));

    // A character that is not a hex digit.
    REQUIRE(is_rejected("1d5a3dd9-2d50-4f2b-a0fb-a3a749eb96cg"));
}

// A Uuid can be built from an iterator pair over 16 bytes, from a std::array or a C array.
TEST_CASE("Construction from iterators", "[pod5::Uuid]")
{
    using namespace std::string_literals;

    // Both sub-cases supply the same 16 bytes, so they share one expected rendering.
    auto const expected_text = "47183823-2574-4bfd-b411-99ed177d3e43"s;

    // Iterators of a std::array.
    {
        std::array<uint8_t, 16> const bytes{
            {0x47, 0x18, 0x38, 0x23, 0x25, 0x74, 0x4b, 0xfd,
             0xb4, 0x11, 0x99, 0xed, 0x17, 0x7d, 0x3e, 0x43}};

        pod5::Uuid from_std_array(bytes.begin(), bytes.end());
        REQUIRE(to_string(from_std_array) == expected_text);
    }

    // Pointers into a C array, obtained through std::begin / std::end.
    {
        uint8_t const bytes[16] = {
            0x47, 0x18, 0x38, 0x23, 0x25, 0x74, 0x4b, 0xfd,
            0xb4, 0x11, 0x99, 0xed, 0x17, 0x7d, 0x3e, 0x43};

        pod5::Uuid from_c_array(std::begin(bytes), std::end(bytes));
        REQUIRE(to_string(from_c_array) == expected_text);
    }
}

// A Uuid can be built directly from 16 bytes given as a braced list, a std::array or a C array.
TEST_CASE("Construction from arrays", "[pod5::Uuid]")
{
    using namespace std::string_literals;

    // All sub-cases supply the same 16 bytes, so they share one expected rendering.
    auto const expected_text = "47183823-2574-4bfd-b411-99ed177d3e43"s;

    // Nested braced list.
    {
        pod5::Uuid from_braces{
            {0x47, 0x18, 0x38, 0x23, 0x25, 0x74, 0x4b, 0xfd,
             0xb4, 0x11, 0x99, 0xed, 0x17, 0x7d, 0x3e, 0x43}};

        REQUIRE(to_string(from_braces) == expected_text);
    }

    // std::array passed as a whole.
    {
        std::array<uint8_t, 16> const bytes{
            {0x47, 0x18, 0x38, 0x23, 0x25, 0x74, 0x4b, 0xfd,
             0xb4, 0x11, 0x99, 0xed, 0x17, 0x7d, 0x3e, 0x43}};

        pod5::Uuid from_std_array(bytes);
        REQUIRE(to_string(from_std_array) == expected_text);
    }

    // C array passed as a whole.
    {
        uint8_t const bytes[16] = {
            0x47, 0x18, 0x38, 0x23, 0x25, 0x74, 0x4b, 0xfd,
            0xb4, 0x11, 0x99, 0xed, 0x17, 0x7d, 0x3e, 0x43};

        pod5::Uuid from_c_array(bytes);
        REQUIRE(to_string(from_c_array) == expected_text);
    }
}

// Equality is reflexive, and a randomly generated Uuid differs from the nil Uuid.
TEST_CASE("Test equality", "[operators]")
{
    pod5::Uuid const nil_uuid;

    auto rng = pod5::UuidRandomGenerator::engine_type{Catch::rngSeed()};
    pod5::UuidRandomGenerator make_uuid{rng};
    pod5::Uuid const random_uuid = make_uuid();

    REQUIRE(nil_uuid == nil_uuid);
    REQUIRE(random_uuid == random_uuid);
    REQUIRE(nil_uuid != random_uuid);
}

// The nil Uuid orders before a generated one, and Uuid works as a std::set key.
TEST_CASE("Test comparison", "[operators]")
{
    pod5::Uuid const nil_uuid{};

    auto rng = pod5::UuidRandomGenerator::engine_type{Catch::rngSeed()};
    pod5::UuidRandomGenerator make_uuid{rng};

    auto const first_generated = make_uuid();
    REQUIRE(nil_uuid < first_generated);

    // Nil plus four further generated ids, inserted in the order they are generated.
    std::set<pod5::Uuid> unique_ids;
    unique_ids.insert(pod5::Uuid{});
    for (int i = 0; i < 4; ++i) {
        unique_ids.insert(make_uuid());
    }

    REQUIRE(unique_ids.size() == 5);
    REQUIRE(unique_ids.count(pod5::Uuid{}) == 1);
}

// Compares std::hash<pod5::Uuid> against hashing the textual form, and checks Uuid works as a
// std::unordered_set key.
TEST_CASE("Test hashing", "[ops]")
{
    using namespace std::string_literals;

    auto const text = "47183823-2574-4bfd-b411-99ed177d3e43"s;
    auto const parsed = pod5::Uuid::from_string(text).value();

    auto const text_hash = std::hash<std::string>{}(text);
    auto const uuid_hash = std::hash<pod5::Uuid>{}(parsed);
    // The two hashes agree only when the Uuid hash is configured to be string based.
#ifdef UUID_HASH_STRING_BASED
    REQUIRE(text_hash == uuid_hash);
#else
    REQUIRE(text_hash != uuid_hash);
#endif

    auto rng = pod5::UuidRandomGenerator::engine_type{Catch::rngSeed()};
    pod5::UuidRandomGenerator make_uuid{rng};

    // Nil plus four generated ids, inserted in the order they are generated.
    std::unordered_set<pod5::Uuid> unique_ids;
    unique_ids.insert(pod5::Uuid{});
    for (int i = 0; i < 4; ++i) {
        unique_ids.insert(make_uuid());
    }

    REQUIRE(unique_ids.size() == 5);
    REQUIRE(unique_ids.count(pod5::Uuid{}) == 1);
}

// Checks that both std::swap and the member swap exchange the contents of two UUIDs: the nil
// value moves to the other object and back again.
TEST_CASE("Test swap", "[ops]")
{
    auto rng = pod5::UuidRandomGenerator::engine_type{Catch::rngSeed()};
    pod5::UuidRandomGenerator make_uuid{rng};

    pod5::Uuid first;  // default-constructed, so it starts out nil
    pod5::Uuid second = make_uuid();

    REQUIRE(first.is_nil());
    REQUIRE_FALSE(second.is_nil());

    // Free-function swap: the nil value ends up in `second`.
    std::swap(first, second);

    REQUIRE_FALSE(first.is_nil());
    REQUIRE(second.is_nil());

    // Member swap: back to the initial state.
    first.swap(second);

    REQUIRE(first.is_nil());
    REQUIRE_FALSE(second.is_nil());
}

// Compile-time check: a Uuid can be default-constructed in a constant expression and is_nil() is
// usable in a static_assert. There is no runtime assertion; the test passes if it compiles.
TEST_CASE("Test constexpr", "[const]")
{
    constexpr pod5::Uuid empty;
    static_assert(empty.is_nil());
}

// Guards the object size: a Uuid must occupy exactly 16 bytes.
TEST_CASE("Test size", "[operators]") { REQUIRE(sizeof(pod5::Uuid) == 16); }


================================================
FILE: ci/docker/Dockerfile.conda
================================================
# Uses the upstream conda-forge mambaforge image as-is, with / as the working directory.
# NOTE(review): the "latest" tag is not pinned, so rebuilds may pick up a newer base image.
FROM condaforge/mambaforge:latest
WORKDIR /


================================================
FILE: ci/docker/Dockerfile.py39.arm64
================================================
# aarch64 gcc9 build image with Python 3.9.10 compiled from source and exposed as python3.
FROM git.oxfordnanolabs.local:4567/minknow/images/build-aarch64-gcc9

# Packages installed before compiling Python.
RUN yum -y groupinstall "Development Tools"
RUN yum -y install wget openssl-devel libffi-devel bzip2-devel

# Download and unpack the Python sources.
RUN wget https://www.python.org/ftp/python/3.9.10/Python-3.9.10.tgz
RUN tar xvf Python-*

# Configure and install from the unpacked source directory.
WORKDIR Python-3.9.10/
RUN ./configure --enable-optimizations
RUN make altinstall

# Point /usr/bin/python3 at the freshly installed interpreter.
RUN rm /usr/bin/python3 && ln -s /usr/local/bin/python3.9 /usr/bin/python3

WORKDIR /


================================================
FILE: ci/docker/Dockerfile.py39.x64
================================================
# x86_64 gcc9 build image with Python 3.9.10 compiled from source and exposed as python3.
FROM git.oxfordnanolabs.local:4567/minknow/images/build-x86_64-gcc9

# Packages installed before compiling Python.
RUN yum -y groupinstall "Development Tools"
RUN yum -y install wget openssl-devel libffi-devel bzip2-devel

# Download and unpack the Python sources.
RUN wget https://www.python.org/ftp/python/3.9.10/Python-3.9.10.tgz
RUN tar xvf Python-*

# Configure and install from the unpacked source directory.
WORKDIR Python-3.9.10/
RUN ./configure --enable-optimizations
RUN make altinstall

# Point /usr/bin/python3 at the freshly installed interpreter.
RUN rm /usr/bin/python3 && ln -s /usr/local/bin/python3.9 /usr/bin/python3

WORKDIR /


================================================
FILE: ci/generate_coverage_report.sh
================================================
#!/bin/bash -e
#
# Runs the ctest tests of an existing build directory and writes gcovr coverage reports
# (Cobertura XML and HTML) into the project root: one pair per test plus one pair for all tests.
#
# Usage: generate_coverage_report.sh build_dir
#
# NOTE(review): the script deletes and re-reads *.gcda files, so build_dir is presumably a build
# compiled with gcov coverage instrumentation -- confirm against the CI configuration.

# Parse args.
if [ $# -ne 1 ]; then
    echo "Usage: $0 build_dir"
    exit 1
fi
# Resolved to an absolute path here because the script changes directory further down.
build_dir=$(realpath "$1")

# Set up the venv.
# The venv is created in (and reused from) the directory the script was started in.
echo "Setting up venv"
if [ ! -e .coverage_venv ]; then
    python3 -m venv .coverage_venv
fi
# shellcheck disable=SC1091 # "Not following: .coverage_venv/bin/activate was not specified as input"
source .coverage_venv/bin/activate
# --cobertura support added in 5.1.
pip install -U 'gcovr>=5.1'

# Determine the root of the project.
# Note: shellcheck wants these split up into separate lines.
# The root is the parent of the directory containing this script.
project_root=$(realpath "$0")
project_root=$(dirname "${project_root}")
project_root=$(dirname "${project_root}")
cd "${project_root}"

# Arguments shared by every gcovr invocation below.
gcovr_args=(
    # work around https://gcc.gnu.org/bugzilla/show_bug.cgi?id=68080
    --gcov-ignore-parse-errors=negative_hits.warn
    # Only report on sources below <project_root>/c++ (the value is a regular expression).
    --filter "${project_root}/c\+\+"
)

# Runs the selected tests and writes the coverage reports for that run.
#   $1: label used in the log message and in the report file names.
#   $2: extra arguments for ctest (may be empty); deliberately word-split.
# Reads the globals project_root, build_dir and gcovr_args.
function generate_coverage {
    local label=$1
    local ctest_selection=$2
    local report_base="${project_root}/coverage-report-${label}"

    echo "Generating coverage report for ${label}"

    # Remove the counters left behind by earlier runs so that this report only covers this run.
    find "${project_root}" -name "*.gcda" -delete

    # Execute the selected tests.
    # shellcheck disable=SC2086 # the selection is intentionally split
    ctest --test-dir "${build_dir}" ${ctest_selection}

    # Write the report in both output formats.
    gcovr "${gcovr_args[@]}" --cobertura "${report_base}.xml"
    gcovr "${gcovr_args[@]}" --html-single-page --html-details "${report_base}.html"
}

# Generate a report for each test.
# `ctest -N` lists the tests without running them; the sed expression keeps only the name from
# each "Test #<n>: <name>" line. Each test is then run on its own via an anchored -R regex.
# NOTE(review): the unquoted $(...) is split on whitespace, so a test name containing spaces
# would be treated as several names.
for test_name in $(ctest --test-dir "${build_dir}" -N | sed -rn 's/^ +Test +#[0-9]+: +(.*)$/\1/p'); do
    generate_coverage "${test_name}" "-R ^${test_name}\$"
done

# Generate a full coverage report too.
generate_coverage "all" ""

# CI wants to see a TOTAL line in order to report coverage, so give it the one from all tests.
# gcovr only has a resolution of 1%, so do the calculation ourselves.
# The percentage printed is 100 * (third column) / (second column) of gcovr's TOTAL line.
gcovr "${gcovr_args[@]}" | grep TOTAL | awk '{print $1, $2, $3, 100 * $3 / $2 "%"}'


================================================
FILE: ci/get_tag_version.cmake
================================================
# Prints the full POD5 version. message() without a mode keyword writes to stderr, which is why
# ci/package.sh captures the output of `cmake -P ci/get_tag_version.cmake` with `2>&1`.
#
# CANONICAL_TAG_BUILD is set before the include so that POD5Version.cmake can see it.
# NOTE(review): presumably this selects the plain tag version string -- confirm in
# cmake/POD5Version.cmake.
set(CANONICAL_TAG_BUILD TRUE)
include("${CMAKE_CURRENT_LIST_DIR}/../cmake/POD5Version.cmake")
message("${POD5_FULL_VERSION}")


================================================
FILE: ci/gitlab-ci-common.yml
================================================
# Default variables shared by the job templates in this file.
variables:
    # User and channel that make up the "<user>/<channel>" part of the conan package references.
    CONAN_USER: nanopore
    CONAN_CHANNEL: stable
    # Recipe location handed to `conan create`, `conan export` and `conan inspect`.
    CONAN_REFERENCE: '.'
    # Location of the .conan dir: having it in $CI_PROJECT_DIR makes it easy to grab the packages as
    # artifacts, and putting it in a job-specific subdir allows multiple packages to be unpacked
    # into a single upload job (otherwise the metadata.json files would overwrite each other)
    CONAN_USER_HOME: '${CI_PROJECT_DIR}/${CI_JOB_ID}'
    # .upload-package multiplies this by the number of recipes to get the expected package count,
    # unless EXPECTED_PACKAGE_COUNT is set.
    PACKAGES_PER_VERSION: 2
    # can set this instead for the total number:
    #EXPECTED_PACKAGE_COUNT: 2

# Packages are built first and uploaded in a second stage.
stages:
    - build
    - upload

# Default before_script: installs the shared conan configuration. CONAN_CONFIG_URL is not defined
# in this file and has to be provided from outside. .upload-package defines its own before_script.
before_script:
    - conan config install --verify-ssl=no "${CONAN_CONFIG_URL}"

#
# use the extends keyword to inherit the job templates defined below
#


.parallel-cppstd:
    # A matrix definition to allow conan builds with different cppstd
    #
    # Profile templates pull this in with `parallel: !reference [.parallel-cppstd,parallel]`, so a
    # job extending them runs once with CONAN_PROFILE_CPPSTD=17 and once with 20.
    parallel:
        matrix:
        - CONAN_PROFILE_CPPSTD: [17, 20]

.tarball-package: &tarball-package
    # gitlab-runner on Windows silently fails to archive files whose full path is longer than 260
    # characters; the MSYS `tar` command is not subject to this limitation (providing Windows has
    # been configured to allow long paths), so we tar up packages in the build job and untar them in
    # the upload job.
    #
    # This also allows us to only archive the package we just built, and not any of its dependencies
    # (because we can use `conan inspect` to find the name of the right packages).
    #
    # This is a list of script lines; the build templates splice it into their after_script via the
    # *tarball-package alias.
    #
    # "${CONAN_USER_HOME#${PWD}/}" strips a leading "${PWD}/", so the paths stored in the tarball are
    # relative to the current directory.
    - PACKAGE_DIR="${CONAN_USER_HOME#${PWD}/}/.conan/data/$(conan inspect --raw name ${CONAN_REFERENCE})"
    - echo "Packing from $PACKAGE_DIR"
    # Only the package directories and metadata.json of every version are archived.
    - tar -czvf "conan-${CI_JOB_ID}.tar.gz" "$PACKAGE_DIR"/*/${CONAN_USER}/${CONAN_CHANNEL}/{package,metadata.json}
    # The job-specific conan home is no longer needed once the tarball exists.
    - rm -rf "${CONAN_USER_HOME}/.conan"

.profile-variables: &profile-variables
    # The caller (an individual package) should have set up either PROFILE_BASE or PROFILE_BASE_HOST
    # and PROFILE_BASE_BUILD. We set variables so that both PROFILE_BASE_HOST and PROFILE_BASE_BUILD
    # are defined correctly after this call, or exit.
    #
    # This is a list of script lines spliced into script sections via the *profile-variables alias.
    # Each `if` statement is spread over several list entries, which relies on the runner joining
    # all script entries into a single shell script.
    #
    # Reject the ambiguous case where PROFILE_BASE is combined with one of the specific variables.
    - if [[ -n ${PROFILE_BASE} && ( -n ${PROFILE_BASE_HOST} || -n ${PROFILE_BASE_BUILD} ) ]]; then
    -     echo "Only one of PROFILE_BASE or (PROFILE_BASE_HOST and PROFILE_BASE_BUILD) should be defined"
    -     exit 1
    - fi
    # Non-cross build: the same profile is used for the host and the build machine.
    - if [[ -n ${PROFILE_BASE} ]]; then
    -     PROFILE_BASE_HOST=${PROFILE_BASE}
    -     PROFILE_BASE_BUILD=${PROFILE_BASE}
    - fi
    # At this point both variables must be known.
    - if [[ -z ${PROFILE_BASE_HOST} || -z ${PROFILE_BASE_BUILD} ]]; then
    -     echo "Both PROFILE_BASE_HOST and PROFILE_BASE_BUILD variables need to be defined"
    -     exit 1
    - fi

.build-package:
    # The script builds all required conan packages. The caller needs to set up:
    #     Either PROFILE_BASE or both PROFILE_BASE_HOST and PROFILE_BASE_BUILD
    #     VERSIONS as a whitespace-separated list if one or more version numbers are wanted.
    #     EXTRA_CREATE_ARGS is passed to conan unchanged, if present.
    #
    # EXTRA_CREATE_ARGS is only used by libcurl, which builds the libcurl in parallel with c_ares
    # set to True and to False.
    # NOTE(review): the libcurl remark looks inherited from a shared template; in this file
    # EXTRA_CREATE_ARGS is set below to arrow options.
    #
    # Every version (or the single unversioned reference when VERSIONS is empty) is built twice,
    # with CONAN_PROFILE_BUILD_TYPE exported as Debug and then as Release.
    #
    # The after_script removes unneeded builds and sources and packages everything into a tarball,
    # artifacts defines the name and path for build artifacts.
    stage: build
    variables:
        # For Linux we need to tell arrow to not use boost.
        EXTRA_CREATE_ARGS: "-o arrow:with_boost=False -o arrow:with_thrift=False -o arrow:parquet=False -o arrow:with_zstd=True"
    script:
        - *profile-variables
        - |
            if [[ -n ${VERSIONS} ]]; then
                for version in ${VERSIONS}; do
                    export CONAN_PROFILE_BUILD_TYPE=Debug
                    conan create --profile:build ${PROFILE_BASE_BUILD} --profile:host ${PROFILE_BASE_HOST} ${CONAN_REFERENCE} ${version}@${CONAN_USER}/${CONAN_CHANNEL} ${EXTRA_CREATE_ARGS}
                    export CONAN_PROFILE_BUILD_TYPE=Release
                    conan create --profile:build ${PROFILE_BASE_BUILD} --profile:host ${PROFILE_BASE_HOST} ${CONAN_REFERENCE} ${version}@${CONAN_USER}/${CONAN_CHANNEL} ${EXTRA_CREATE_ARGS}
                done
            else
                export CONAN_PROFILE_BUILD_TYPE=Debug
                conan create --profile:build ${PROFILE_BASE_BUILD} --profile:host ${PROFILE_BASE_HOST}  ${CONAN_REFERENCE} ${CONAN_USER}/${CONAN_CHANNEL} ${EXTRA_CREATE_ARGS}
                export CONAN_PROFILE_BUILD_TYPE=Release
                conan create --profile:build ${PROFILE_BASE_BUILD} --profile:host ${PROFILE_BASE_HOST} ${CONAN_REFERENCE} ${CONAN_USER}/${CONAN_CHANNEL} ${EXTRA_CREATE_ARGS}
            fi
    after_script:
        # Re-load the venv if it exists
        - if ls .venv/*/activate >/dev/null 2>&1; then source .venv/*/activate; fi
        - conan --version
        # Avoid storing things on the CI node unnecessarily
        - conan remove "*" --builds --src --force
        - *tarball-package
    artifacts:
        name: "${CI_PROJECT_NAME}-${CI_JOB_ID}"
        paths:
            # Matches the tarball written by the *tarball-package lines.
            - 'conan-*.tar.gz'

.build-package-win:
    # Almost the same as build-package. Sets two additional variables CONAN_USER_HOME_SHORT and
    # CONAN_USE_ALWAYS_SHORT_PATHS. "script" is exactly the same as for build-package. "after_script"
    # does some additional processing needed for Windows between removing conan builds and sources,
    # and creating tarballs.
    #
    # The after_script below is a complete replacement for the one in .build-package; it does not
    # contain that template's venv re-load and `conan --version` lines.
    extends: .build-package
    variables:
        # avoid interfering with the standard conan short-path directory
        CONAN_USER_HOME_SHORT: 'c:\.conan-tmp'
        # we're nesting conan's data dir pretty deep, so build systems that would normally be ok can
        # fail if we don't use short paths
        CONAN_USE_ALWAYS_SHORT_PATHS: '1'
        # We need to override arrow's boost 1.85.0 requirement to match the version we use internally.
        EXTRA_CREATE_ARGS: "-o arrow:with_thrift=False -o arrow:parquet=False --require=boost/1.86.0@ -o boost:without_locale=True"

    after_script:
        # Avoid storing things on the CI node unnecessarily
        - conan remove "*" --builds --src --force
        # CONAN_USE_ALWAYS_SHORT_PATHS links paths deep in the data dir to dirs in c:\.conan
        # Resolve package links (so they can be gathered into artifacts):
        - shopt -s nullglob # allow there to be nothing, eg: if CONAN_USE_ALWAYS_SHORT_PATHS is off
        # MOVE_COMMAND can be set to, say, "cp -r" if necessary. Moving has been seen to fail for
        # packages with executables (especially if those executables are run as part of the test
        # package), such as protobuf.
        #
        # Each .conan_link file holds the path of the real package directory; its contents are
        # moved next to the link file and the link file is then removed.
        - for link in ${CONAN_USER_HOME}/.conan/data/*/*/$CONAN_USER/$CONAN_CHANNEL/package/*/.conan_link; do
            source=$(cat $link) && ${MOVE_COMMAND:-mv} $(cygpath "$source")/* $(dirname $link) && rm $link;
          done
        # Clean up the short_paths folder (even on failure):
        - rm -rf "/c/.conan-tmp"
        - *tarball-package

# Overrides the script section so that a static and a shared variant of a library are built for
# every build type. The "conan create" call is the one from build-package with either
# -o ${PACKAGE}:shared=False or -o ${PACKAGE}:shared=True added. Since this template has no
# "extends" of its own, the caller has to extend either build-package or build-package-win too.
.build-shared-and-static:
    script:
        - *profile-variables
        - PACKAGE="$(conan inspect --raw name .)"
        - |
            # With VERSIONS set, every entry is built as "<version>@<user>/<channel>"; otherwise
            # the unversioned "<user>/<channel>" reference is built once.
            if [[ -n ${VERSIONS} ]]; then
                references=()
                for version in ${VERSIONS}; do
                    references+=("${version}@${CONAN_USER}/${CONAN_CHANNEL}")
                done
            else
                references=("${CONAN_USER}/${CONAN_CHANNEL}")
            fi
            # Build order per reference: Debug static, Debug shared, Release static, Release shared.
            for reference in "${references[@]}"; do
                for build_type in Debug Release; do
                    export CONAN_PROFILE_BUILD_TYPE=${build_type}
                    for shared in False True; do
                        conan create --profile:build ${PROFILE_BASE_BUILD} --profile:host ${PROFILE_BASE_HOST} ${CONAN_REFERENCE} ${reference} -o ${PACKAGE}:shared=${shared} ${EXTRA_CREATE_ARGS}
                    done
                done
            done

.upload-package:
    # Unpacks the tarballs produced by the build jobs and, for every job directory found in them,
    # re-exports the recipe(s), checks that the expected number of recipes and packages is present
    # and runs `conan upload` against the ont-artifactory remote (with --skip-upload unless the
    # branch is an upload branch or DO_UPLOAD says otherwise).
    #
    # Variables read by the script: VERSIONS, CONAN_REFERENCE, CONAN_USER, CONAN_CHANNEL,
    # PACKAGES_PER_VERSION or EXPECTED_PACKAGE_COUNT, DO_UPLOAD, STABLE_BRANCH_NAME,
    # CONAN_CONFIG_URL, CONAN_LOGIN_USERNAME and CONAN_PASSWORD.
    stage: upload
    image: git.oxfordnanolabs.local:4567/traque/ont-docker-base/ont-base-python:3.8
    tags:
        - linux
        - docker
    # Replaces the file-level before_script: conan 1.x is installed here and configured later, once
    # per job directory, inside the script.
    before_script:
        - echo -e "\e[0Ksection_start:`date +%s`:install_conan[collapsed=true]\r\e[0KInstalling conan"
        - pip install 'conan<2'
        - echo -e "\e[0Ksection_end:`date +%s`:install_conan\r\e[0K"
    script:
        # BSD tar (on macOS) puts some extra optional information into the tarballs that GNU tar
        # complains about. --warning=no-unknown-keyword suppresses this.
        - for tarball in conan-*.tar.gz; do tar --warning=no-unknown-keyword -xf "$tarball"; done
        # Everything up to the closing "done # for conan_dir" entry runs once per unpacked job
        # directory, each with its own CONAN_USER_HOME.
        - for conan_dir in ./*/.conan; do
        - job_dir="$(dirname "$conan_dir")"
        - echo -e "\e[0Ksection_start:`date +%s`:upload_package\r\e[0KUploading from $job_dir"
        - export CONAN_USER_HOME="$PWD/$job_dir"
        - conan config install --verify-ssl=no "${CONAN_CONFIG_URL}"
        # Export the recipe(s) so that they exist next to the unpacked binary packages.
        - if [[ -n ${VERSIONS} ]]; then
        -     expected_recipe_count=$(echo ${VERSIONS} | wc -w)
        -     for version in ${VERSIONS}; do
        -         conan export ${CONAN_REFERENCE} ${version}@${CONAN_USER}/${CONAN_CHANNEL}
        -     done
        - else
        -     expected_recipe_count=1
        -     conan export ${CONAN_REFERENCE} ${CONAN_USER}/${CONAN_CHANNEL}
        - fi
        # Count the recipes and binary packages that are actually present.
        - PACKAGE="$(conan inspect --raw name ${CONAN_REFERENCE})"
        - recipes="$(conan search --raw "${PACKAGE}/*@${CONAN_USER}/${CONAN_CHANNEL}")"
        - recipe_count="$(echo $recipes | wc -w)"
        - package_count=0
        - for recipe in $recipes; do
        -   echo "${recipe}:"
        -   conan search "$recipe"
        -   package_count=$(($package_count + $(conan search "$recipe" | grep "Package_ID:" | wc -l)))
        - done
        # EXPECTED_PACKAGE_COUNT is only derived when it is empty, so a value computed in the first
        # iteration of the conan_dir loop is reused by later iterations.
        - if [[ -z $EXPECTED_PACKAGE_COUNT ]]; then
        -   EXPECTED_PACKAGE_COUNT=$((PACKAGES_PER_VERSION * expected_recipe_count))
        - fi
        - if [[ $recipe_count -ne $expected_recipe_count ]] || [[ $package_count -ne $EXPECTED_PACKAGE_COUNT ]]; then
        -     echo "Expected $expected_recipe_count recipe(s) with $EXPECTED_PACKAGE_COUNT package(s), got $recipe_count recipe(s) with $package_count package(s)"
        -     exit 1
        - fi
        # conan claims it should pick this information up automatically, given the variable names,
        # but it doesn't seem to work if you don't do this:
        - conan user -r ont-artifactory -p "${CONAN_PASSWORD}" "${CONAN_LOGIN_USERNAME}"
        # Unless DO_UPLOAD was set from outside, upload only from stable/*, release/* and the
        # branch named by STABLE_BRANCH_NAME. Like EXPECTED_PACKAGE_COUNT, the decision is made
        # once and reused by later iterations.
        - EXTRA_ARGS=
        - if [[ -z $DO_UPLOAD ]]; then
        -   DO_UPLOAD=no
        -   if [[ $CI_COMMIT_REF_NAME == stable/* ]] || [[ $CI_COMMIT_REF_NAME == release/* ]] || [[ $CI_COMMIT_REF_NAME == $STABLE_BRANCH_NAME ]]; then
        -     DO_UPLOAD=yes
        -   fi
        - fi
        - if [[ $DO_UPLOAD == "yes" ]]; then
        -   EXTRA_ARGS=--force
        - else
        # This entry is quoted because the message contains ": ", which YAML would otherwise read
        # as a mapping.
        -   'echo "WARNING: NOT uploading to artifactory for this branch"'
        -   EXTRA_ARGS=--skip-upload
        - fi
        - for recipe in $recipes; do
        -   conan upload -r ont-artifactory --all --check --confirm ${EXTRA_ARGS} "$recipe"
        - done
        - echo -e "\e[0Ksection_end:`date +%s`:upload_package\r\e[0K"
        - done # for conan_dir

#
# Various setup methods. Each sets a number of relevant tags, and one or two variables: For
# non-cross compiling one variable PROFILE_BASE is set with the name of a profile, which is used
# for both the build and the host machine and is adapted for debug and release builds. For cross
# compiling two variables are set instead: PROFILE_BASE_BUILD for the profile of the build
# machine and PROFILE_BASE_HOST for the profile of the host machine.
#

#
# Set up for Windows versions
#
.profile-windows-x86_64-vs2019:
    # Set up for Windows x86_64 using VS 2019, using conan and the profile windows-x86_64-vs2019,
    # adapted for debug and release. To be called from individual packages by using "extends".
    tags:
        - windows
        - cmake
        - VS2019
        - conan
    variables:
        PROFILE_BASE: windows-x86_64-vs2019.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-windows-x86_64-vs2019-conan2:
    # Conan 2 variant of the Windows x86_64 / VS 2019 set up: same runner tags and profile as
    # .profile-windows-x86_64-vs2019, plus the CMake generator and the CMake preset to use. To be
    # called from individual packages by using "extends".
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    tags:
        - windows
        - cmake
        - VS2019
        - conan
    variables:
        CMAKE_GENERATOR: "Visual Studio 16 2019"
        PROFILE_BASE: windows-x86_64-vs2019.jinja
        CMAKE_PRESET: "conan2-windows-x86_64-vs2019-cppstd${CONAN_PROFILE_CPPSTD}-release"

#
# Set up for MacOS versions
#
.profile-macos-aarch64-appleclang-15.0:
    # Set up for MacOS arm 64 using clang 15.0, using conan and the profile
    # macos-aarch64-appleclang-15.0, adapted for debug and release. To be called from individual
    # packages by using "extends".
    tags:
        - osx_arm64
        - xcode-15.3
        - conan
    variables:
        PROFILE_BASE: macos-aarch64-appleclang-15.0.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-macos-aarch64-appleclang-16.0:
    # Set up for MacOS arm 64 using clang 16.0, using conan and the profile
    # macos-aarch64-appleclang-16.0, adapted for debug and release. To be called from individual
    # packages by using "extends".
    tags:
        - osx_arm64
        - xcode-16.1
        - conan
    variables:
        PROFILE_BASE: macos-aarch64-appleclang-16.0.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-macos-aarch64-appleclang-15.0-conan2:
    # Conan 2 variant of the MacOS arm 64 / clang 15.0 set up: same runner tags and profile as
    # .profile-macos-aarch64-appleclang-15.0, plus the CMake preset to use. To be called from
    # individual packages by using "extends".
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    tags:
        - osx_arm64
        - xcode-15.3
        - conan
    variables:
        PROFILE_BASE: macos-aarch64-appleclang-15.0.jinja
        CMAKE_PRESET: "conan2-macos-appleclang-15.0-aarch64-cppstd${CONAN_PROFILE_CPPSTD}-release"

.profile-macos-aarch64-appleclang-16.0-conan2:
    # Conan 2 variant of the MacOS arm 64 / clang 16.0 set up: same runner tags and profile as
    # .profile-macos-aarch64-appleclang-16.0, plus the CMake preset to use. To be called from
    # individual packages by using "extends".
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    tags:
        - osx_arm64
        - xcode-16.1
        - conan
    variables:
        PROFILE_BASE: macos-aarch64-appleclang-16.0.jinja
        CMAKE_PRESET: "conan2-macos-appleclang-16.0-aarch64-cppstd${CONAN_PROFILE_CPPSTD}-release"
#
# Set up for linux versions
#
.profile-linux-x86_64-gcc9:
    # Set up for linux x86_64 using gcc9, using docker and the profile linux-x86_64-gcc9, adapted
    # for debug and release. To be called from individual packages by using "extends".
    #
    # The docker image builds on CentOS 7 using devtoolset-9, for maximum compatibility. This means
    # the compiled code will work on any Ubuntu distro from Xenial onwards (and most other
    # still-supported Linux distros). Differences between GCC 9's libstdc++ and GCC 4.8's libstdc++
    # are handled by a static library, so no special handling of libstdc++ is required.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc9:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc9.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-linux-x86_64-gcc9-conan2:
    # Conan 2 variant of the linux x86_64 / gcc9 set up: same image, runner tags and profile as
    # .profile-linux-x86_64-gcc9, plus the CMake preset to use.
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc9:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc9.jinja
        CMAKE_PRESET: "conan2-linux-gcc9-x86_64-cppstd${CONAN_PROFILE_CPPSTD}-release"


.profile-linux-x86_64-gcc11:
    # Set up for linux x86_64 using gcc11, using docker and the profile linux-x86_64-gcc11, adapted
    # for debug and release. To be called from individual packages by using "extends".
    #
    # Note that the docker image uses a GCC 11 backport to Ubuntu Bionic. Compiled artifacts will
    # be mostly compatible with Ubuntu Bionic and later, except that they will need the correct
    # libstdc++ to be available. This can be achieved by installing libstdc++6 from the GCC 11
    # backport (available in the ~ubuntu-toolchain-r/test PPA), or by otherwise shipping that
    # version of libstdc++6 in a way that the software can find it.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc11:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc11.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-linux-x86_64-gcc11-conan2:
    # Conan 2 variant of the linux x86_64 / gcc11 set up: same image, runner tags and profile as
    # .profile-linux-x86_64-gcc11, plus the CMake preset to use.
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc11:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc11.jinja
        CMAKE_PRESET: "conan2-linux-gcc11-x86_64-cppstd${CONAN_PROFILE_CPPSTD}-release"

# Conan 2 sanitizer set ups for linux x86_64 / gcc11 (asan, usan and tsan static profiles). All
# three use the linux-x86_64-gcc11 image and runner tags and differ only in the conan profile and
# the CMake preset. The preset names embed ${CONAN_PROFILE_CPPSTD}; no .parallel-cppstd matrix is
# referenced here, so that variable is presumably supplied by the extending job.
.profile-linux-x86_64-gcc11-asan-static-conan2:
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc11:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc11-asan-static.jinja
        CMAKE_PRESET: "conan2-linux-gcc11-asan-static-x86_64-cppstd${CONAN_PROFILE_CPPSTD}-release"

.profile-linux-x86_64-gcc11-usan-static-conan2:
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc11:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc11-usan-static.jinja
        CMAKE_PRESET: "conan2-linux-gcc11-usan-static-x86_64-cppstd${CONAN_PROFILE_CPPSTD}-release"

.profile-linux-x86_64-gcc11-tsan-static-conan2:
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc11:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc11-tsan-static.jinja
        CMAKE_PRESET: "conan2-linux-gcc11-tsan-static-x86_64-cppstd${CONAN_PROFILE_CPPSTD}-release"

.profile-linux-x86_64-gcc11-asan-static:
    # Same image, runner tags and cppstd matrix as .profile-linux-x86_64-gcc11; only the conan
    # profile is replaced by the asan-static one.
    extends: .profile-linux-x86_64-gcc11
    variables:
        PROFILE_BASE: linux-x86_64-gcc11-asan-static.jinja

.profile-linux-x86_64-gcc11-ausan-static:
    # Same image, runner tags and cppstd matrix as .profile-linux-x86_64-gcc11; only the conan
    # profile is replaced by the ausan-static one.
    extends: .profile-linux-x86_64-gcc11
    variables:
        PROFILE_BASE: linux-x86_64-gcc11-ausan-static.jinja

.profile-linux-x86_64-gcc11-tsan-static:
    # Same image, runner tags and cppstd matrix as .profile-linux-x86_64-gcc11; only the conan
    # profile is replaced by the tsan-static one.
    extends: .profile-linux-x86_64-gcc11
    variables:
        PROFILE_BASE: linux-x86_64-gcc11-tsan-static.jinja

.profile-linux-x86_64-gcc11-usan-static:
    # Same image, runner tags and cppstd matrix as .profile-linux-x86_64-gcc11; only the conan
    # profile is replaced by the usan-static one.
    extends: .profile-linux-x86_64-gcc11
    variables:
        PROFILE_BASE: linux-x86_64-gcc11-usan-static.jinja

.profile-linux-x86_64-gcc13:
    # Set up for linux x86_64 using gcc13, using docker and the profile linux-x86_64-gcc13. To be
    # called from individual packages by using "extends"; also the base of the gcc13 sanitizer
    # templates below.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc13:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc13.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-linux-x86_64-gcc13-conan2:
    # Conan 2 variant of the linux x86_64 / gcc13 set up: same image, runner tags and profile as
    # .profile-linux-x86_64-gcc13, plus the CMake preset to use.
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-x86_64-gcc13:latest
    tags:
        - linux_x86
        - docker
    variables:
        PROFILE_BASE: linux-x86_64-gcc13.jinja
        CMAKE_PRESET: "conan2-linux-gcc13-x86_64-cppstd${CONAN_PROFILE_CPPSTD}-release"

# Sanitizer set ups for linux x86_64 / gcc13. Each one inherits the image, runner tags and cppstd
# matrix from .profile-linux-x86_64-gcc13 and only replaces the conan profile.
.profile-linux-x86_64-gcc13-asan-static:
    extends: .profile-linux-x86_64-gcc13
    variables:
        PROFILE_BASE: linux-x86_64-gcc13-asan-static.jinja

.profile-linux-x86_64-gcc13-tsan-static:
    extends: .profile-linux-x86_64-gcc13
    variables:
        PROFILE_BASE: linux-x86_64-gcc13-tsan-static.jinja

.profile-linux-x86_64-gcc13-usan-static:
    extends: .profile-linux-x86_64-gcc13
    variables:
        PROFILE_BASE: linux-x86_64-gcc13-usan-static.jinja


.profile-linux-aarch64-gcc9:
    # Set up for linux arm64 using gcc9, using docker and the profile linux-aarch64-gcc9, adapted
    # for debug and release. To be called from individual packages by using "extends".
    #
    # The docker image builds on CentOS 7 using devtoolset-9, for maximum compatibility. This means
    # the compiled code will work on any Ubuntu distro from Xenial onwards (and most other
    # still-supported Linux distros). Differences between GCC 9's libstdc++ and GCC 4.8's libstdc++
    # are handled by a static library, so no special handling of libstdc++ is required.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-aarch64-gcc9:latest
    tags:
        - linux_aarch64
        - docker
    variables:
        PROFILE_BASE: linux-aarch64-gcc9.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-linux-aarch64-gcc9-conan2:
    # Conan 2 variant of the linux arm64 / gcc9 set up: same image, runner tags and profile as
    # .profile-linux-aarch64-gcc9, plus the CMake preset to use.
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-aarch64-gcc9:latest
    tags:
        - linux_aarch64
        - docker
    variables:
        PROFILE_BASE: linux-aarch64-gcc9.jinja
        CMAKE_PRESET: "conan2-linux-gcc9-aarch64-cppstd${CONAN_PROFILE_CPPSTD}-release"

.profile-linux-aarch64-gcc11:
    # Set up for linux arm64 using gcc11, using docker and the profile linux-aarch64-gcc11, adapted
    # for debug and release. To be called from individual packages by using "extends".
    #
    # Note that the docker image uses a GCC 11 backport to Ubuntu Bionic. Compiled artifacts will
    # be mostly compatible with Ubuntu Bionic and later, except that they will need the correct
    # libstdc++ to be available. This can be achieved by installing libstdc++6 from the GCC 11
    # backport (available in the ~ubuntu-toolchain-r/test PPA), or by otherwise shipping that
    # version of libstdc++6 in a way that the software can find it.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-aarch64-gcc11:latest
    tags:
        - linux_aarch64
        - docker
    variables:
        PROFILE_BASE: linux-aarch64-gcc11.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-linux-aarch64-gcc11-conan2:
    # Conan 2 variant of the linux arm64 / gcc11 set up: same image, runner tags and profile as
    # .profile-linux-aarch64-gcc11, plus the CMake preset to use.
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-aarch64-gcc11:latest
    tags:
        - linux_aarch64
        - docker
    variables:
        PROFILE_BASE: linux-aarch64-gcc11.jinja
        CMAKE_PRESET: "conan2-linux-gcc11-aarch64-cppstd${CONAN_PROFILE_CPPSTD}-release"

.profile-linux-aarch64-gcc13:
    # Set up for linux arm64 using gcc13, using docker and the profile linux-aarch64-gcc13. To be
    # called from individual packages by using "extends".
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-aarch64-gcc13:latest
    tags:
        - linux_aarch64
        - docker
    variables:
        PROFILE_BASE: linux-aarch64-gcc13.jinja
    # Pulls in the cppstd matrix from .parallel-cppstd (one job per C++ standard).
    parallel: !reference [.parallel-cppstd,parallel]

.profile-linux-aarch64-gcc13-conan2:
    # Conan 2 variant of the linux arm64 / gcc13 set up: same image, runner tags and profile as
    # .profile-linux-aarch64-gcc13, plus the CMake preset to use.
    #
    # The preset name embeds ${CONAN_PROFILE_CPPSTD}. No .parallel-cppstd matrix is referenced
    # here, so that variable is presumably supplied by the extending job.
    image: git.oxfordnanolabs.local:4567/informatics/conan-config/linux-aarch64-gcc13:latest
    tags:
        - linux_aarch64
        - docker
    variables:
        PROFILE_BASE: linux-aarch64-gcc13.jinja
        CMAKE_PRESET: "conan2-linux-gcc13-aarch64-cppstd${CONAN_PROFILE_CPPSTD}-release"


================================================
FILE: ci/install.sh
================================================
#!/bin/bash
#
# Installs the "archive" and "wheel" install components of a CMake build tree into ./archive and
# ./wheel. It reads ./cmake_install.cmake, so it has to be run from the build directory.
#
# Usage: install.sh [STATIC_BUILD]

set -o errexit
set -o pipefail
set -o nounset
# set -o xtrace

# Install the archive component into ./archive:
(
    cmake -DCMAKE_INSTALL_PREFIX="archive" -DBUILD_TYPE="Release" -DCOMPONENT="archive" -P "cmake_install.cmake"
    # For a static build the third-party libraries are copied next to the installed ones. On Linux
    # the copy goes into lib64 when the install step created that directory, otherwise into lib.
    if [ "$#" -ge 1 ] && [ "$1" == "STATIC_BUILD" ]; then
        if [[ "$OSTYPE" == "linux-gnu"* ]] && [[ -e "archive/lib64" ]]; then
            cp "../build/third_party/libs"/* "archive/lib64"
        else
            cp "../build/third_party/libs"/* "archive/lib"
        fi
    fi
)

# Install the wheel component into ./wheel:
(
    cmake -DCMAKE_INSTALL_PREFIX="wheel" -DBUILD_TYPE="Release" -DCOMPONENT="wheel" -P "cmake_install.cmake"
)


================================================
FILE: ci/package.sh
================================================
#!/bin/bash
#
# Packages the ./archive and ./wheel directories of the current directory:
#   - ./archive is written to <repo root>/lib_pod5-<version>-<output_sku>.tar.gz
#   - wheels in ./wheel (optional) are moved to the repo root, or repaired into it with auditwheel
#     when an auditwheel platform is given.
#
# Usage: package.sh output_sku [auditwheel_platform]

set -o errexit
set -o pipefail
set -o nounset
# set -o xtrace

# Without this check a missing argument would only produce bash's "unbound variable" message.
if [ $# -lt 1 ]; then
    echo "Usage: $0 output_sku [auditwheel_platform]" >&2
    exit 1
fi

output_sku=$1
auditwheel_platform=
if [ $# -gt 1 ]; then
    auditwheel_platform="${2}"
fi

CURRENT_DIR=$(pwd)

SCRIPT_DIR=$( cd -- "$( dirname -- "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )
REPO_ROOT="${SCRIPT_DIR}/../"

# The version script prints through cmake's message(), which writes to stderr, hence the 2>&1.
cd "${REPO_ROOT}"
pod5_version="$(cmake -P ci/get_tag_version.cmake 2>&1)"

cd "${CURRENT_DIR}"

# Tar up the archive build:
(
    cd ./archive
    tar -cvzf "${REPO_ROOT}/lib_pod5-${pod5_version}-${output_sku}.tar.gz" .
)

# Find the wheel:
(
    # Wheels are optional:
    if [ -d "wheel/" ] ; then
        cd wheel/
        if [ -z "${auditwheel_platform}" ]; then
            mv ./*.whl "${REPO_ROOT}/"
        else
            echo "Running audit wheel"
            pwd
            ls
            auditwheel repair ./*.whl --plat "${auditwheel_platform}" -w "${REPO_ROOT}/"
        fi
    fi
)


================================================
FILE: ci/unpack_libs_for_python.sh
================================================
#!/bin/bash

# Unpack every lib_pod5-<version>-<sku>.tar.gz archive found in <input_dir>
# and place the contents of its lib/ directory into <output_dir>/<sku>/.
#
# Usage: unpack_libs_for_python.sh <input_dir> <output_dir>

# Fail on the first error so a broken archive or a failed move cannot leave a
# silently incomplete output tree behind (matches the other ci/ scripts).
set -o errexit
set -o pipefail
set -o nounset

if [ "$#" -lt 2 ]; then
    echo "Usage: $0 <input_dir> <output_dir>" >&2
    exit 1
fi

input_dir=$1
output_dir=$2

echo "Unpacking builds from $input_dir to $output_dir"

# Capture group 1 is the SKU; the dots of the extension are escaped so they
# only match literal dots.
file_regex='.*/lib_pod5-[0-9.]*-(.*)\.tar\.gz'
for i in "${input_dir}"/lib_pod5*.tar.gz; do

    if [[ $i =~ $file_regex ]]
    then
        sku="${BASH_REMATCH[1]}"
        echo "Extracting for SKU: $sku"
    else
        # Also reached when the glob matched nothing and $i is the raw pattern.
        echo "$i doesn't match expected file pattern" >&2
        exit 1
    fi

    sku_out_dir="$output_dir/$sku/"
    mkdir -p "${sku_out_dir}"

    # Extract into a scratch directory first so that only lib/ is kept.
    tmp_dir="$output_dir/tmp"
    mkdir -p "$tmp_dir"
    tar -xzf "$i" --directory "$tmp_dir"

    mv "${tmp_dir}"/lib/* "${sku_out_dir}"

    rm -r "$tmp_dir"
done

echo "unpacked skus:"
ls "${output_dir}/"
echo "contents:"
ls "${output_dir}"/*


================================================
FILE: cmake/BuildFlatBuffers.cmake
================================================
# Copyright 2015 Google Inc. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# General function to create FlatBuffer build rules for the given list of
# schemas.
#
# flatbuffers_schemas: A list of flatbuffer schema files to process.
#
# schema_include_dirs: A list of schema file include directories, which will be
# passed to flatc via the -I parameter.
#
# custom_target_name: The generated files will be added as dependencies for a
# new custom target with this name. You should add that target as a dependency
# for your main target to ensure these files are built. You can also retrieve
# various properties from this target, such as GENERATED_INCLUDES_DIR,
# BINARY_SCHEMAS_DIR, and COPY_TEXT_SCHEMAS_DIR.
#
# additional_dependencies: A list of additional dependencies that you'd like
# all generated files to depend on. Pass in a blank string if you have none.
#
# generated_includes_dir: Where to generate the C++ header files for these
# schemas. The generated includes directory will automatically be added to
# CMake's include directories, and will be where generated header files are
# placed. This parameter is optional; pass in empty string if you don't want to
# generate include files for these schemas.
#
# binary_schemas_dir: If you specify an optional binary schema directory, binary
# schemas will be generated for these schemas as well, and placed into the given
# directory.
#
# copy_text_schemas_dir: If you want all text schemas (including schemas from
# all schema include directories) copied into a directory (for example, if you
# need them within your project to build JSON files), you can specify that
# folder here. All text schemas will be copied to that folder.
#
# IMPORTANT: Make sure you quote all list arguments you pass to this function!
# Otherwise CMake will only pass in the first element.
# Example: build_flatbuffers("${fb_files}" "${include_dirs}" target_name ...)
function(build_flatbuffers flatbuffers_schemas
                           schema_include_dirs
                           custom_target_name
                           additional_dependencies
                           generated_includes_dir
                           binary_schemas_dir
                           copy_text_schemas_dir)
  # Creates one custom command per schema (C++ header and/or binary schema),
  # optionally copies the text schemas, and gathers everything behind the
  # custom target `custom_target_name`.
  #
  # The optional directory arguments are compared as quoted strings
  # ("${var}" STREQUAL ""): callers are told to pass an empty string to
  # disable a feature, and an unquoted empty expansion would drop the operand
  # from the if() command entirely.

  # Test if including from FindFlatBuffers
  if(FLATBUFFERS_FLATC_EXECUTABLE)
    set(FLATC_TARGET "")
    set(FLATC ${FLATBUFFERS_FLATC_EXECUTABLE})
  else()
    set(FLATC_TARGET flatc)
    set(FLATC flatc)
  endif()
  # Caller-provided extra arguments go before the default --gen-mutable.
  set(FLATC_SCHEMA_ARGS --gen-mutable)
  if(FLATBUFFERS_FLATC_SCHEMA_EXTRA_ARGS)
    set(FLATC_SCHEMA_ARGS
      ${FLATBUFFERS_FLATC_SCHEMA_EXTRA_ARGS}
      ${FLATC_SCHEMA_ARGS}
      )
  endif()

  set(working_dir "${CMAKE_CURRENT_SOURCE_DIR}")

  set(schema_glob "*.fbs")
  # Generate the include files parameters.
  set(include_params "")
  set(all_generated_files "")
  foreach (include_dir ${schema_include_dirs})
    # Each directory is prepended, so the final -I order is the reverse of
    # schema_include_dirs.
    set(include_params -I ${include_dir} ${include_params})
    if (NOT "${copy_text_schemas_dir}" STREQUAL "")
      # Copy text schemas from dependent folders.
      file(GLOB_RECURSE dependent_schemas ${include_dir}/${schema_glob})
      foreach (dependent_schema ${dependent_schemas})
        file(COPY ${dependent_schema} DESTINATION ${copy_text_schemas_dir})
      endforeach()
    endif()
  endforeach()

  foreach(schema ${flatbuffers_schemas})
    get_filename_component(filename ${schema} NAME_WE)
    # For each schema, do the things we requested.
    if (NOT "${generated_includes_dir}" STREQUAL "")
      set(generated_include ${generated_includes_dir}/${filename}_generated.h)
      add_custom_command(
        OUTPUT ${generated_include}
        COMMAND ${FLATC} ${FLATC_SCHEMA_ARGS}
        -o ${generated_includes_dir}
        ${include_params}
        -c ${schema}
        DEPENDS ${FLATC_TARGET} ${schema} ${additional_dependencies}
        WORKING_DIRECTORY "${working_dir}")
      list(APPEND all_generated_files ${generated_include})
    endif()

    if (NOT "${binary_schemas_dir}" STREQUAL "")
      set(binary_schema ${binary_schemas_dir}/${filename}.bfbs)
      add_custom_command(
        OUTPUT ${binary_schema}
        COMMAND ${FLATC} -b --schema
        -o ${binary_schemas_dir}
        ${include_params}
        ${schema}
        DEPENDS ${FLATC_TARGET} ${schema} ${additional_dependencies}
        WORKING_DIRECTORY "${working_dir}")
      list(APPEND all_generated_files ${binary_schema})
    endif()

    if (NOT "${copy_text_schemas_dir}" STREQUAL "")
      file(COPY ${schema} DESTINATION ${copy_text_schemas_dir})
    endif()
  endforeach()

  # Create a custom target that depends on all the generated files.
  # This is the target that you can depend on to trigger all these
  # to be built.
  add_custom_target(${custom_target_name}
                    DEPENDS ${all_generated_files} ${additional_dependencies})

  # Register the include directory we are using.
  if (NOT "${generated_includes_dir}" STREQUAL "")
    include_directories(${generated_includes_dir})
    set_property(TARGET ${custom_target_name}
      PROPERTY GENERATED_INCLUDES_DIR
      ${generated_includes_dir})
  endif()

  # Register the binary schemas dir we are using.
  if (NOT "${binary_schemas_dir}" STREQUAL "")
    set_property(TARGET ${custom_target_name}
      PROPERTY BINARY_SCHEMAS_DIR
      ${binary_schemas_dir})
  endif()

  # Register the text schema copy dir we are using.
  if (NOT "${copy_text_schemas_dir}" STREQUAL "")
    set_property(TARGET ${custom_target_name}
      PROPERTY COPY_TEXT_SCHEMAS_DIR
      ${copy_text_schemas_dir})
  endif()
endfunction()

# Creates a target that can be linked against that generates flatbuffer headers.
#
# This function takes a target name and a list of schemas. You can also specify
# other flatc flags using the FLAGS option to change the behavior of the flatc
# tool.
#
# Arguments:
#   TARGET: The name of the target to generate.
#   SCHEMAS: The list of schema files to generate code for.
#   BINARY_SCHEMAS_DIR: Optional. The directory in which to generate binary
#       schemas. Binary schemas will only be generated if a path is provided.
#   INCLUDE: Optional. Search for includes in the specified paths. (Use this
#       instead of "-I <path>" and the FLAGS option so that CMake is aware of
#       the directories that need to be searched).
#   INCLUDE_PREFIX: Optional. The directory in which to place the generated
#       files. Use this instead of the --include-prefix option.
#   FLAGS: Optional. A list of any additional flags that you would like to pass
#       to flatc.
#
# Example:
#
#     flatbuffers_generate_headers(
#         TARGET my_generated_headers_target
#         INCLUDE_PREFIX "${MY_INCLUDE_PREFIX}"
#         SCHEMAS ${MY_SCHEMA_FILES}
#         BINARY_SCHEMAS_DIR "${MY_BINARY_SCHEMA_DIRECTORY}"
#         FLAGS --gen-object-api)
#
#     target_link_libraries(MyExecutableTarget
#         PRIVATE my_generated_headers_target
#     )
function(flatbuffers_generate_headers)
  # Creates an INTERFACE library named by TARGET whose sources are the headers
  # (and, with --grpc, the gRPC sources) that flatc generates from SCHEMAS.
  # Generated files are placed under
  # ${CMAKE_CURRENT_BINARY_DIR}/<TARGET>[/<INCLUDE_PREFIX>].

  # Parse function arguments.
  set(options)
  set(one_value_args
    "TARGET"
    "INCLUDE_PREFIX"
    "BINARY_SCHEMAS_DIR")
  set(multi_value_args
    "SCHEMAS"
    "INCLUDE"
    "FLAGS")
  cmake_parse_arguments(
    PARSE_ARGV 0
    FLATBUFFERS_GENERATE_HEADERS
    "${options}"
    "${one_value_args}"
    "${multi_value_args}")

  # Test if including from FindFlatBuffers
  if(FLATBUFFERS_FLATC_EXECUTABLE)
    set(FLATC_TARGET "")
    set(FLATC ${FLATBUFFERS_FLATC_EXECUTABLE})
  else()
    set(FLATC_TARGET flatc)
    set(FLATC flatc)
  endif()

  set(working_dir "${CMAKE_CURRENT_SOURCE_DIR}")

  # Start the accumulators empty: a function scope sees the caller's
  # variables, so list(APPEND) would otherwise extend any same-named list
  # defined by the caller.
  set(all_generated_header_files "")
  set(all_generated_source_files "")
  set(all_generated_binary_files "")

  # Generate the include files parameters.
  set(include_params "")
  foreach (include_dir ${FLATBUFFERS_GENERATE_HEADERS_INCLUDE})
    set(include_params -I ${include_dir} ${include_params})
  endforeach()

  # Create a directory to place the generated code.
  set(generated_target_dir "${CMAKE_CURRENT_BINARY_DIR}/${FLATBUFFERS_GENERATE_HEADERS_TARGET}")
  set(generated_include_dir "${generated_target_dir}")
  # Optional arguments are compared as quoted strings so that an absent
  # (empty) value still leaves a well-formed if() command.
  if (NOT "${FLATBUFFERS_GENERATE_HEADERS_INCLUDE_PREFIX}" STREQUAL "")
    set(generated_include_dir "${generated_include_dir}/${FLATBUFFERS_GENERATE_HEADERS_INCLUDE_PREFIX}")
    list(APPEND FLATBUFFERS_GENERATE_HEADERS_FLAGS
         "--include-prefix" ${FLATBUFFERS_GENERATE_HEADERS_INCLUDE_PREFIX})
  endif()

  # Create rules to generate the code for each schema.
  foreach(schema ${FLATBUFFERS_GENERATE_HEADERS_SCHEMAS})
    get_filename_component(filename ${schema} NAME_WE)
    set(generated_include "${generated_include_dir}/${filename}_generated.h")

    # Generate files for grpc if needed
    set(generated_source_file)
    if("${FLATBUFFERS_GENERATE_HEADERS_FLAGS}" MATCHES "--grpc")
      # Check if schema file contain a rpc_service definition
      file(STRINGS ${schema} has_grpc REGEX "rpc_service")
      if(has_grpc)
        list(APPEND generated_include "${generated_include_dir}/${filename}.grpc.fb.h")
        set(generated_source_file "${generated_include_dir}/${filename}.grpc.fb.cc")
      endif()
    endif()

    # FLATC_ARGS is not set in this function; it is only non-empty when the
    # calling scope defines it.
    add_custom_command(
      OUTPUT ${generated_include} ${generated_source_file}
      COMMAND ${FLATC} ${FLATC_ARGS}
      -o ${generated_include_dir}
      ${include_params}
      -c ${schema}
      ${FLATBUFFERS_GENERATE_HEADERS_FLAGS}
      DEPENDS ${FLATC_TARGET} ${schema}
      WORKING_DIRECTORY "${working_dir}"
      COMMENT "Building ${schema} flatbuffers...")
    list(APPEND all_generated_header_files ${generated_include})
    list(APPEND all_generated_source_files ${generated_source_file})

    # Generate the binary flatbuffers schemas if instructed to.
    if (NOT "${FLATBUFFERS_GENERATE_HEADERS_BINARY_SCHEMAS_DIR}" STREQUAL "")
      set(binary_schema
          "${FLATBUFFERS_GENERATE_HEADERS_BINARY_SCHEMAS_DIR}/${filename}.bfbs")
      add_custom_command(
        OUTPUT ${binary_schema}
        COMMAND ${FLATC} -b --schema
        -o ${FLATBUFFERS_GENERATE_HEADERS_BINARY_SCHEMAS_DIR}
        ${include_params}
        ${schema}
        DEPENDS ${FLATC_TARGET} ${schema}
        WORKING_DIRECTORY "${working_dir}")
      list(APPEND all_generated_binary_files ${binary_schema})
    endif()
  endforeach()

  # Set up interface library
  add_library(${FLATBUFFERS_GENERATE_HEADERS_TARGET} INTERFACE)
  target_sources(
    ${FLATBUFFERS_GENERATE_HEADERS_TARGET}
    INTERFACE
      ${all_generated_header_files}
      ${all_generated_binary_files}
      ${all_generated_source_files}
      ${FLATBUFFERS_GENERATE_HEADERS_SCHEMAS})
  # NOTE(review): this passes ${FLATC} (the executable path when
  # FLATBUFFERS_FLATC_EXECUTABLE is set) and the schema file paths, whereas the
  # DEPENDS clauses above use ${FLATC_TARGET} — confirm this is intended.
  add_dependencies(
    ${FLATBUFFERS_GENERATE_HEADERS_TARGET}
    ${FLATC}
    ${FLATBUFFERS_GENERATE_HEADERS_SCHEMAS})
  target_include_directories(
    ${FLATBUFFERS_GENERATE_HEADERS_TARGET}
    INTERFACE ${generated_target_dir})

  # Organize file layout for IDEs.
  source_group(
    TREE "${generated_target_dir}"
    PREFIX "Flatbuffers/Generated/Headers Files"
    FILES ${all_generated_header_files})
  source_group(
    TREE "${generated_target_dir}"
    PREFIX "Flatbuffers/Generated/Source Files"
    FILES ${all_generated_source_files})
  source_group(
    TREE ${working_dir}
    PREFIX "Flatbuffers/Schemas"
    FILES ${FLATBUFFERS_GENERATE_HEADERS_SCHEMAS})
  if (NOT "${FLATBUFFERS_GENERATE_HEADERS_BINARY_SCHEMAS_DIR}" STREQUAL "")
    source_group(
      TREE "${FLATBUFFERS_GENERATE_HEADERS_BINARY_SCHEMAS_DIR}"
      PREFIX "Flatbuffers/Generated/Binary Schemas"
      FILES ${all_generated_binary_files})
  endif()
endfunction()

# Creates a target that can be linked against that generates flatbuffer binaries
# from json files.
#
# This function takes a target name and a list of schemas and Json files. You
# can also specify other flatc flags and options to change the behavior of the
# flatc compiler.
#
# Adding this target to your executable ensures that the flatbuffer binaries
# are compiled before your executable is run.
#
# Arguments:
#   TARGET: The name of the target to generate.
#   JSON_FILES: The list of json files to compile to flatbuffers binaries.
#   SCHEMA: The flatbuffers schema of the Json files to be compiled.
#   INCLUDE: Optional. Search for includes in the specified paths. (Use this
#       instead of "-I <path>" and the FLAGS option so that CMake is aware of
#       the directories that need to be searched).
#   OUTPUT_DIR: The directory where the generated flatbuffers binaries should be
#       placed.
#   FLAGS: Optional. A list of any additional flags that you would like to pass
#       to flatc.
#
# Example:
#
#     flatbuffers_generate_binary_files(
#         TARGET my_binary_data
#         SCHEMA "${MY_SCHEMA_DIR}/my_example_schema.fbs"
#         JSON_FILES ${MY_JSON_FILES}
#         OUTPUT_DIR "${MY_BINARY_DATA_DIRECTORY}"
#         FLAGS --strict-json)
#
#     target_link_libraries(MyExecutableTarget
#         PRIVATE my_binary_data
#     )
function(flatbuffers_generate_binary_files)
  # Creates an INTERFACE library named by TARGET whose sources are the .bin
  # files that flatc produces from JSON_FILES using SCHEMA, written to
  # OUTPUT_DIR.

  # Parse function arguments.
  set(options)
  set(one_value_args
    "TARGET"
    "SCHEMA"
    "OUTPUT_DIR")
  set(multi_value_args
    "JSON_FILES"
    "INCLUDE"
    "FLAGS")
  cmake_parse_arguments(
    PARSE_ARGV 0
    FLATBUFFERS_GENERATE_BINARY_FILES
    "${options}"
    "${one_value_args}"
    "${multi_value_args}")

  # Test if including from FindFlatBuffers
  if(FLATBUFFERS_FLATC_EXECUTABLE)
    set(FLATC_TARGET "")
    set(FLATC ${FLATBUFFERS_FLATC_EXECUTABLE})
  else()
    set(FLATC_TARGET flatc)
    set(FLATC flatc)
  endif()

  set(working_dir "${CMAKE_CURRENT_SOURCE_DIR}")

  # Start the accumulator empty: a function scope sees the caller's variables,
  # so list(APPEND) would otherwise extend a same-named list defined by the
  # caller.
  set(all_generated_binary_files "")

  # Generate the include files parameters.
  set(include_params "")
  foreach (include_dir ${FLATBUFFERS_GENERATE_BINARY_FILES_INCLUDE})
    set(include_params -I ${include_dir} ${include_params})
  endforeach()

  # Create rules to generate the flatbuffers binary for each json file.
  foreach(json_file ${FLATBUFFERS_GENERATE_BINARY_FILES_JSON_FILES})
    get_filename_component(filename ${json_file} NAME_WE)
    set(generated_binary_file "${FLATBUFFERS_GENERATE_BINARY_FILES_OUTPUT_DIR}/${filename}.bin")
    # FLATC_ARGS is not set in this function; it is only non-empty when the
    # calling scope defines it.
    add_custom_command(
      OUTPUT ${generated_binary_file}
      COMMAND ${FLATC} ${FLATC_ARGS}
      -o ${FLATBUFFERS_GENERATE_BINARY_FILES_OUTPUT_DIR}
      ${include_params}
      -b ${FLATBUFFERS_GENERATE_BINARY_FILES_SCHEMA} ${json_file}
      ${FLATBUFFERS_GENERATE_BINARY_FILES_FLAGS}
      DEPENDS ${FLATC_TARGET} ${json_file}
      WORKING_DIRECTORY "${working_dir}"
      COMMENT "Building ${json_file} binary flatbuffers...")
    list(APPEND all_generated_binary_files ${generated_binary_file})
  endforeach()

  # Set up interface library
  add_library(${FLATBUFFERS_GENERATE_BINARY_FILES_TARGET} INTERFACE)
  target_sources(
    ${FLATBUFFERS_GENERATE_BINARY_FILES_TARGET}
    INTERFACE
      ${all_generated_binary_files}
      ${FLATBUFFERS_GENERATE_BINARY_FILES_JSON_FILES}
      ${FLATBUFFERS_GENERATE_BINARY_FILES_SCHEMA})
  # NOTE(review): ${FLATC} is the executable path (not a target name) when
  # FLATBUFFERS_FLATC_EXECUTABLE is set — confirm this is intended.
  add_dependencies(
    ${FLATBUFFERS_GENERATE_BINARY_FILES_TARGET}
    ${FLATC})

  # Organize file layout for IDEs.
  source_group(
    TREE ${working_dir}
    PREFIX "Flatbuffers/JSON Files"
    FILES ${FLATBUFFERS_GENERATE_BINARY_FILES_JSON_FILES})
  source_group(
    TREE ${working_dir}
    PREFIX "Flatbuffers/Schemas"
    FILES ${FLATBUFFERS_GENERATE_BINARY_FILES_SCHEMA})
  source_group(
    TREE ${FLATBUFFERS_GENERATE_BINARY_FILES_OUTPUT_DIR}
    PREFIX "Flatbuffers/Generated/Binary Files"
    FILES ${all_generated_binary_files})
endfunction()


================================================
FILE: cmake/Findzstd.cmake
================================================
# Find module for zstd.
#
# Sets ZSTD_INCLUDE_DIRS, ZSTD_LIBRARIES and ZSTD_VERSION_STRING, and defines
# the imported target zstd::zstd when the library is found.

# Header lookup; the Conan include directories are offered as extra search
# locations.
find_path(ZSTD_INCLUDE_DIR
    NAMES zstd.h
    PATHS
        ${CONAN_INCLUDE_DIRS_RELEASE}
        ${CONAN_INCLUDE_DIRS_DEBUG}
)

# Library names to try; the debug lookup prefers the "d"-suffixed names.
set(ZSTD_NAMES zstd zstd_static)
set(ZSTD_NAMES_DEBUG zstdd zstd_staticd)

find_library(ZSTD_LIBRARY_RELEASE
    NAMES ${ZSTD_NAMES}
    PATHS ${CONAN_LIB_DIRS_RELEASE}
)
find_library(ZSTD_LIBRARY_DEBUG
    NAMES
        ${ZSTD_NAMES_DEBUG}
        ${ZSTD_NAMES}
    PATHS ${CONAN_LIB_DIRS_DEBUG}
)

include(SelectLibraryConfigurations)
select_library_configurations(ZSTD)

# Read the three version components out of the #define lines in zstd.h.
if(ZSTD_INCLUDE_DIR AND EXISTS "${ZSTD_INCLUDE_DIR}/zstd.h")
    foreach(_zstd_version_part MAJOR MINOR RELEASE)
        file(STRINGS "${ZSTD_INCLUDE_DIR}/zstd.h" ZSTD_VERSION_${_zstd_version_part}_LINE
             REGEX "^#define ZSTD_VERSION_${_zstd_version_part}.*$")
        string(REGEX REPLACE "^.*ZSTD_VERSION_${_zstd_version_part} *([0-9]+)$" "\\1"
               ZSTD_VERSION_${_zstd_version_part} "${ZSTD_VERSION_${_zstd_version_part}_LINE}")
    endforeach()
    unset(_zstd_version_part)

    set(ZSTD_VERSION_STRING "${ZSTD_VERSION_MAJOR}.${ZSTD_VERSION_MINOR}.${ZSTD_VERSION_RELEASE}")
endif()

# Handle the QUIETLY and REQUIRED arguments and report the package as found
# only if all listed variables are set.
include(FindPackageHandleStandardArgs)
find_package_handle_standard_args(zstd
    REQUIRED_VARS ZSTD_LIBRARY ZSTD_INCLUDE_DIR
    VERSION_VAR ZSTD_VERSION_STRING)


if(ZSTD_FOUND)
    set(ZSTD_INCLUDE_DIRS ${ZSTD_INCLUDE_DIR})

    if(NOT ZSTD_LIBRARIES)
        set(ZSTD_LIBRARIES ${ZSTD_LIBRARY})
    endif()

    if(NOT TARGET zstd::zstd)
        add_library(zstd::zstd UNKNOWN IMPORTED)
        set_property(TARGET zstd::zstd PROPERTY
            INTERFACE_INCLUDE_DIRECTORIES "${ZSTD_INCLUDE_DIRS}")

        # Register each configuration for which a library was located.
        foreach(_zstd_config RELEASE DEBUG)
            if(ZSTD_LIBRARY_${_zstd_config})
                set_property(TARGET zstd::zstd APPEND PROPERTY
                    IMPORTED_CONFIGURATIONS ${_zstd_config})
                set_property(TARGET zstd::zstd PROPERTY
                    IMPORTED_LOCATION_${_zstd_config} "${ZSTD_LIBRARY_${_zstd_config}}")
            endif()
        endforeach()
        unset(_zstd_config)

        # Neither per-configuration library is set: fall back to the plain one.
        if(NOT ZSTD_LIBRARY_RELEASE AND NOT ZSTD_LIBRARY_DEBUG)
            set_property(TARGET zstd::zstd APPEND PROPERTY
                IMPORTED_LOCATION "${ZSTD_LIBRARY}")
        endif()
    endif()
endif()


================================================
FILE: cmake/conan_provider.cmake
================================================
# The MIT License (MIT)
#
# Copyright (c) 2024 JFrog
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.

# NOTE(review): presumably the oldest Conan client version this provider
# accepts; the code that reads it is not part of this excerpt — confirm.
set(CONAN_MINIMUM_VERSION 2.0.5)

# Create a new policy scope and set the minimum required cmake version so the
# features behind a policy setting like if(... IN_LIST ...) behaves as expected
# even if the parent project does not specify a minimum cmake version or a minimum
# version less than this module requires (e.g. 3.0) before the first project() call.
# (see: https://cmake.org/cmake/help/latest/variable/CMAKE_PROJECT_TOP_LEVEL_INCLUDES.html)
#
# The policy-affecting calls like cmake_policy(SET...) or `cmake_minimum_required` only
# affects the current policy scope, i.e. between the PUSH and POP in this case.
#
# https://cmake.org/cmake/help/book/mastering-cmake/chapter/Policies.html#the-policy-stack
cmake_policy(PUSH)
cmake_minimum_required(VERSION 3.24)


# Derive OS-related values from the CMake platform variables.
#
# Each argument is the NAME of a variable to set in the caller's scope:
#   os            - mapped from CMAKE_SYSTEM_NAME (e.g. Darwin -> Macos)
#   os_api_level  - Android only: API level
#   os_sdk        - Apple platforms only: SDK name derived from CMAKE_OSX_SYSROOT
#   os_subsystem  - cygwin / msys2 when building for those environments
#   os_version    - Apple platforms only: CMAKE_OSX_DEPLOYMENT_TARGET
# Nothing is set when CMAKE_SYSTEM_NAME is empty or "Generic".
function(detect_os os os_api_level os_sdk os_subsystem os_version)
    # it could be cross compilation
    message(STATUS "CMake-Conan: cmake_system_name=${CMAKE_SYSTEM_NAME}")
    if(CMAKE_SYSTEM_NAME AND NOT CMAKE_SYSTEM_NAME STREQUAL "Generic")
        if(CMAKE_SYSTEM_NAME STREQUAL "Darwin")
            set(${os} Macos PARENT_SCOPE)
        elseif(CMAKE_SYSTEM_NAME STREQUAL "QNX")
            set(${os} Neutrino PARENT_SCOPE)
        elseif(CMAKE_SYSTEM_NAME STREQUAL "CYGWIN")
            set(${os} Windows PARENT_SCOPE)
            set(${os_subsystem} cygwin PARENT_SCOPE)
        elseif(CMAKE_SYSTEM_NAME MATCHES "^MSYS")
            set(${os} Windows PARENT_SCOPE)
            set(${os_subsystem} msys2 PARENT_SCOPE)
        elseif(CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
            # https://github.com/emscripten-core/emscripten/blob/4.0.6/cmake/Modules/Platform/Emscripten.cmake#L17C1-L17C34
            set(${os} Emscripten PARENT_SCOPE)
        else()
            set(${os} ${CMAKE_SYSTEM_NAME} PARENT_SCOPE)
        endif()
        if(CMAKE_SYSTEM_NAME STREQUAL "Android")
            if(DEFINED ANDROID_PLATFORM)
                # Quoted so that a defined-but-empty ANDROID_PLATFORM is still a
                # valid input argument for string(REGEX MATCH).
                string(REGEX MATCH "[0-9]+" _os_api_level "${ANDROID_PLATFORM}")
            elseif(DEFINED CMAKE_SYSTEM_VERSION)
                set(_os_api_level ${CMAKE_SYSTEM_VERSION})
            endif()
            message(STATUS "CMake-Conan: android api level=${_os_api_level}")
            set(${os_api_level} ${_os_api_level} PARENT_SCOPE)
        endif()
        if(CMAKE_SYSTEM_NAME MATCHES "Darwin|iOS|tvOS|watchOS")
            # CMAKE_OSX_SYSROOT contains the full path to the SDK for MakeFile/Ninja
            # generators, but just has the original input string for Xcode.
            # Quoted so that an empty sysroot still gives IS_DIRECTORY an operand.
            if(NOT IS_DIRECTORY "${CMAKE_OSX_SYSROOT}")
                set(_os_sdk ${CMAKE_OSX_SYSROOT})
            else()
                if(CMAKE_OSX_SYSROOT MATCHES Simulator)
                    set(apple_platform_suffix simulator)
                else()
                    set(apple_platform_suffix os)
                endif()
                if(CMAKE_OSX_SYSROOT MATCHES AppleTV)
                    set(_os_sdk "appletv${apple_platform_suffix}")
                elseif(CMAKE_OSX_SYSROOT MATCHES iPhone)
                    set(_os_sdk "iphone${apple_platform_suffix}")
                elseif(CMAKE_OSX_SYSROOT MATCHES Watch)
                    set(_os_sdk "watch${apple_platform_suffix}")
                endif()
            endif()
            # os_sdk is a parameter of this function, so this test always
            # passes; an empty _os_sdk clears the caller's variable.
            if(DEFINED os_sdk)
                message(STATUS "CMake-Conan: cmake_osx_sysroot=${CMAKE_OSX_SYSROOT}")
                set(${os_sdk} ${_os_sdk} PARENT_SCOPE)
            endif()
            if(DEFINED CMAKE_OSX_DEPLOYMENT_TARGET)
                message(STATUS "CMake-Conan: cmake_osx_deployment_target=${CMAKE_OSX_DEPLOYMENT_TARGET}")
                set(${os_version} ${CMAKE_OSX_DEPLOYMENT_TARGET} PARENT_SCOPE)
            endif()
        endif()
    endif()
endfunction()


# Map the target architecture reported by CMake to an architecture name and
# store it in the caller's variable named by `arch`.
#
# The source value is CMAKE_OSX_ARCHITECTURES on Apple platforms (when
# non-empty), CMAKE_CXX_COMPILER_ARCHITECTURE_ID for MSVC, and
# CMAKE_SYSTEM_PROCESSOR otherwise. Emscripten builds always yield "wasm".
function(detect_arch arch)
    # CMAKE_OSX_ARCHITECTURES can contain multiple architectures, but Conan only supports one.
    # Therefore this code only finds one. If the recipes support multiple architectures, the
    # build will work. Otherwise, there will be a linker error for the missing architecture(s).
    if(DEFINED CMAKE_OSX_ARCHITECTURES)
        string(REPLACE " " ";" apple_arch_list "${CMAKE_OSX_ARCHITECTURES}")
        list(LENGTH apple_arch_list apple_arch_count)
        if(apple_arch_count GREATER 1)
            message(WARNING "CMake-Conan: Multiple architectures detected, this will only work if Conan recipe(s) produce fat binaries.")
        endif()
    endif()
    if(CMAKE_SYSTEM_NAME MATCHES "Darwin|iOS|tvOS|watchOS" AND NOT CMAKE_OSX_ARCHITECTURES STREQUAL "")
        set(host_arch ${CMAKE_OSX_ARCHITECTURES})
    elseif(MSVC)
        set(host_arch ${CMAKE_CXX_COMPILER_ARCHITECTURE_ID})
    else()
        set(host_arch ${CMAKE_SYSTEM_PROCESSOR})
    endif()
    if(host_arch MATCHES "aarch64|arm64|ARM64")
        set(_arch armv8)
    elseif(host_arch MATCHES armv7s)
        # Must be tested before the generic armv7 pattern below: MATCHES is an
        # unanchored regex search, so "armv7" also matches "armv7s".
        set(_arch armv7s)
    elseif(host_arch MATCHES "armv7|armv7-a|armv7l|ARMV7")
        set(_arch armv7)
    elseif(host_arch MATCHES "i686|i386|X86")
        set(_arch x86)
    elseif(host_arch MATCHES "AMD64|amd64|x86_64|x64")
        set(_arch x86_64)
    endif()
    if(EMSCRIPTEN)
        # https://github.com/emscripten-core/emscripten/blob/4.0.6/cmake/Modules/Platform/Emscripten.cmake#L294C1-L294C80
        set(_arch wasm)
    endif()
    message(STATUS "CMake-Conan: cmake_system_processor=${_arch}")
    set(${arch} ${_arch} PARENT_SCOPE)
endfunction()


# Store the C++ standard in the caller's variable named by `cxx_standard`:
# CMAKE_CXX_STANDARD as-is, or prefixed with "gnu" when CMAKE_CXX_EXTENSIONS
# is enabled.
function(detect_cxx_standard cxx_standard)
    if(CMAKE_CXX_EXTENSIONS)
        set(${cxx_standard} "gnu${CMAKE_CXX_STANDARD}" PARENT_SCOPE)
    else()
        set(${cxx_standard} ${CMAKE_CXX_STANDARD} PARENT_SCOPE)
    endif()
endfunction()


# Probe the C++ standard library with two compile checks and leave the results
# in the calling scope:
#   _conan_is_gnu_libstdcxx     - true if the GNU libstdc++ macros are defined
#   _conan_gnu_libstdcxx_suffix - "11" if the second check compiles, else ""
macro(detect_gnu_libstdcxx)
    # Compiles only when a GNU libstdc++ identification macro is defined.
    check_cxx_source_compiles("
    #include <cstddef>
    #if !defined(__GLIBCXX__) && !defined(__GLIBCPP__)
    static_assert(false);
    #endif
    int main(){}" _conan_is_gnu_libstdcxx)

    # Compiles only when std::string is not pointer-sized, which is taken as
    # the indicator for the C++11 ABI.
    check_cxx_source_compiles("
    #include <string>
    static_assert(sizeof(std::string) != sizeof(void*), \"using libstdc++\");
    int main () {}" _conan_gnu_libstdcxx_is_cxx11_abi)

    if(_conan_gnu_libstdcxx_is_cxx11_abi)
        set(_conan_gnu_libstdcxx_suffix "11")
    else()
        set(_conan_gnu_libstdcxx_suffix "")
    endif()
    unset(_conan_gnu_libstdcxx_is_cxx11_abi)
endmacro()


# Probe for LLVM libc++ with a compile check. Being a macro, the result
# variable _conan_is_libcxx is left in the calling scope.
macro(detect_libcxx)
    # _conan_is_libcxx true if LLVM libc++
    # The probe fails to compile unless _LIBCPP_VERSION is defined.
    check_cxx_source_compiles("
    #include <cstddef>
    #if !defined(_LIBCPP_VERSION)
       static_assert(false);
    #endif
    int main(){}" _conan_is_libcxx)
endmacro()


# Determine the C++ standard library name and store it in the caller's
# variable named by `lib_cxx`. The variable is left untouched for MSVC, for
# unrecognised compilers, and for Clang when neither probe succeeds.
function(detect_lib_cxx lib_cxx)
    # Android: the STL type is taken directly from the toolchain setting.
    if(CMAKE_SYSTEM_NAME STREQUAL "Android")
        message(STATUS "CMake-Conan: android_stl=${CMAKE_ANDROID_STL_TYPE}")
        set(${lib_cxx} ${CMAKE_ANDROID_STL_TYPE} PARENT_SCOPE)
        return()
    endif()

    include(CheckCXXSourceCompiles)

    if(CMAKE_CXX_COMPILER_ID MATCHES "GNU")
        detect_gnu_libstdcxx()
        set(${lib_cxx} "libstdc++${_conan_gnu_libstdcxx_suffix}" PARENT_SCOPE)
    elseif(CMAKE_CXX_COMPILER_ID MATCHES "AppleClang")
        set(${lib_cxx} "libc++" PARENT_SCOPE)
    elseif(CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND NOT CMAKE_SYSTEM_NAME MATCHES "Windows")
        # Try libc++ first; only probe for libstdc++ when that fails.
        detect_libcxx()
        if(_conan_is_libcxx)
            set(${lib_cxx} "libc++" PARENT_SCOPE)
        else()
            detect_gnu_libstdcxx()
            if(_conan_is_gnu_libstdcxx)
                set(${lib_cxx} "libstdc++${_conan_gnu_libstdcxx_suffix}" PARENT_SCOPE)
            endif()
            # TODO: it would be an error if neither probe succeeded
        endif()
    elseif(CMAKE_CXX_COMPILER_ID MATCHES "MSVC")
        # Do nothing - compiler.runtime and compiler.runtime_type
        # should be handled separately: https://github.com/conan-io/cmake-conan/pull/516
    else()
        # TODO: unable to determine, ask user to provide a full profile file instead
    endif()
endfunction()


# Derive compiler settings from the CMake compiler variables.
#
# Each argument is the NAME of a variable to set in the caller's scope:
#   compiler              - msvc / apple-clang / clang / gcc, or the raw CMake
#                           compiler id when none of those match
#   compiler_version      - first three characters of MSVC_VERSION for MSVC,
#                           major version only for AppleClang / Clang / GNU
#   compiler_runtime      - MSVC only: "dynamic" or "static"
#   compiler_runtime_type - MSVC only: "Debug" or "Release", set only when the
#                           runtime library is not a generator expression
# The C++ compiler is preferred; the C compiler is used when no C++ compiler
# id is defined. Raises a fatal error if neither is defined.
function(detect_compiler compiler compiler_version compiler_runtime compiler_runtime_type)
    if(DEFINED CMAKE_CXX_COMPILER_ID)
        set(_compiler ${CMAKE_CXX_COMPILER_ID})
        set(_compiler_version ${CMAKE_CXX_COMPILER_VERSION})
    else()
        if(NOT DEFINED CMAKE_C_COMPILER_ID)
            message(FATAL_ERROR "C or C++ compiler not defined")
        endif()
        set(_compiler ${CMAKE_C_COMPILER_ID})
        set(_compiler_version ${CMAKE_C_COMPILER_VERSION})
    endif()

    message(STATUS "CMake-Conan: CMake compiler=${_compiler}")
    message(STATUS "CMake-Conan: CMake compiler version=${_compiler_version}")

    if(_compiler MATCHES MSVC)
        set(_compiler "msvc")
        # Keep only the first three characters of MSVC_VERSION.
        string(SUBSTRING ${MSVC_VERSION} 0 3 _compiler_version)
        # Configure compiler.runtime and compiler.runtime_type settings for MSVC
        if(CMAKE_MSVC_RUNTIME_LIBRARY)
            set(_msvc_runtime_library ${CMAKE_MSVC_RUNTIME_LIBRARY})
        else()
            set(_msvc_runtime_library MultiThreaded$<$<CONFIG:Debug>:Debug>DLL) # default value documented by CMake
        endif()

        set(_KNOWN_MSVC_RUNTIME_VALUES "")
        list(APPEND _KNOWN_MSVC_RUNTIME_VALUES MultiThreaded MultiThreadedDLL)
        list(APPEND _KNOWN_MSVC_RUNTIME_VALUES MultiThreadedDebug MultiThreadedDebugDLL)
        list(APPEND _KNOWN_MSVC_RUNTIME_VALUES MultiThreaded$<$<CONFIG:Debug>:Debug> MultiThreaded$<$<CONFIG:Debug>:Debug>DLL)

        # only accept the 6 possible values, otherwise we don't know how to map this
        if(NOT _msvc_runtime_library IN_LIST _KNOWN_MSVC_RUNTIME_VALUES)
            message(FATAL_ERROR "CMake-Conan: unable to map MSVC runtime: ${_msvc_runtime_library} to Conan settings")
        endif()

        # Runtime is "dynamic" in all cases if it ends in DLL
        if(_msvc_runtime_library MATCHES ".*DLL$")
            set(_compiler_runtime "dynamic")
        else()
            set(_compiler_runtime "static")
        endif()
        message(STATUS "CMake-Conan: CMake compiler.runtime=${_compiler_runtime}")

        # Only define compiler.runtime_type when explicitly requested
        # If a generator expression is used, let Conan handle it conditional on build_type
        if(NOT _msvc_runtime_library MATCHES "<CONFIG:Debug>:Debug>")
            if(_msvc_runtime_library MATCHES "Debug")
                set(_compiler_runtime_type "Debug")
            else()
                set(_compiler_runtime_type "Release")
            endif()
            message(STATUS "CMake-Conan: CMake compiler.runtime_type=${_compiler_runtime_type}")
        endif()

        unset(_KNOWN_MSVC_RUNTIME_VALUES)

    # AppleClang must be tested before the generic Clang pattern, which would
    # also match it. The three branches below keep only the major version.
    elseif(_compiler MATCHES AppleClang)
        set(_compiler "apple-clang")
        string(REPLACE "." ";" VERSION_LIST ${_compiler_version})
        list(GET VERSION_LIST 0 _compiler_version)
    elseif(_compiler MATCHES Clang)
        set(_compiler "clang")
        string(REPLACE "." ";" VERSION_LIST ${_compiler_version})
        list(GET VERSION_LIST 0 _compiler_version)
    elseif(_compiler MATCHES GNU)
        set(_compiler "gcc")
        string(REPLACE "." ";" VERSION_LIST ${_compiler_version})
        list(GET VERSION_LIST 0 _compiler_version)
    endif()

    message(STATUS "CMake-Conan: [settings] compiler=${_compiler}")
    message(STATUS "CMake-Conan: [settings] compiler.version=${_compiler_version}")
    if (_compiler_runtime)
        message(STATUS "CMake-Conan: [settings] compiler.runtime=${_compiler_runtime}")
    endif()
    if (_compiler_runtime_type)
        message(STATUS "CMake-Conan: [settings] compiler.runtime_type=${_compiler_runtime_type}")
    endif()

    # Publish the results; the runtime values are only assigned in the MSVC
    # branch above.
    set(${compiler} ${_compiler} PARENT_SCOPE)
    set(${compiler_version} ${_compiler_version} PARENT_SCOPE)
    set(${compiler_runtime} ${_compiler_runtime} PARENT_SCOPE)
    set(${compiler_runtime_type} ${_compiler_runtime_type} PARENT_SCOPE)
endfunction()


# Report the build type that should go into the Conan profile.
#
# build_type: name of the variable to set in the caller's scope.
#
# The caller's variable is only written for single-configuration generators,
# where it receives the value of CMAKE_BUILD_TYPE. For multi-configuration
# generators it is left untouched.
function(detect_build_type build_type)
    get_property(_is_multi_config GLOBAL PROPERTY GENERATOR_IS_MULTI_CONFIG)
    if(_is_multi_config)
        # Multi-config generator: nothing to report.
        return()
    endif()

    # Note: we may want to fail early if `CMAKE_BUILD_TYPE` is not defined
    set(${build_type} ${CMAKE_BUILD_TYPE} PARENT_SCOPE)
endfunction()


# Clear a compiler entry when it is the compiler that xcrun would select anyway.
#
# lang:            CMake language name used to build the CMAKE_<lang>_COMPILER*
#                  variable names (called below with C and CXX).
# command:         tool name passed to `xcrun --find` (called with cc and c++).
# output_variable: name of the variable to reset to "" in the caller's scope.
#
# Only acts when CMAKE_<lang>_COMPILER_ID is exactly "AppleClang". This is a
# macro, so it runs in the caller's scope; the temporaries are unset at the end.
macro(set_conan_compiler_if_appleclang lang command output_variable)
    if(CMAKE_${lang}_COMPILER_ID STREQUAL "AppleClang")
        # Ask xcrun where the tool of the active toolchain lives.
        execute_process(COMMAND xcrun --find ${command}
            OUTPUT_VARIABLE _xcrun_out OUTPUT_STRIP_TRAILING_WHITESPACE)
        # Compare the directory reported by xcrun with the directory of the
        # compiler CMake is configured with.
        cmake_path(GET _xcrun_out PARENT_PATH _xcrun_toolchain_path)
        cmake_path(GET CMAKE_${lang}_COMPILER PARENT_PATH _compiler_parent_path)
        if ("${_xcrun_toolchain_path}" STREQUAL "${_compiler_parent_path}")
            # Same directory: drop the explicit entry.
            # NOTE(review): presumably so the default Xcode toolchain compiler
            # is not pinned by path in the generated profile - confirm.
            set(${output_variable} "")
        endif()
        unset(_xcrun_out)
        unset(_xcrun_toolchain_path)
        unset(_compiler_parent_path)
    endif()
endmacro()


# Append a `tools.build:compiler_executables={...}` line to the caller's
# `profile` variable, listing the C, C++ and RC compilers known to CMake.
#
# Takes no arguments. This is a macro: it reads CMAKE_C_COMPILER,
# CMAKE_CXX_COMPILER and CMAKE_RC_COMPILER and appends to `profile` in the
# caller's scope. Nothing is appended when no compiler entry remains.
macro(append_compiler_executables_configuration)
    set(_conan_c_compiler "")
    set(_conan_cpp_compiler "")
    set(_conan_rc_compiler "")
    set(_conan_compilers_list "")
    if(CMAKE_C_COMPILER)
        # Entry is a JSON-like "key":"path" pair.
        set(_conan_c_compiler "\"c\":\"${CMAKE_C_COMPILER}\"")
        # May reset the entry to "" for AppleClang; appending an empty,
        # unquoted value below then adds nothing to the list.
        set_conan_compiler_if_appleclang(C cc _conan_c_compiler)
        list(APPEND _conan_compilers_list ${_conan_c_compiler})
    else()
        message(WARNING "CMake-Conan: The C compiler is not defined. "
                        "Please define CMAKE_C_COMPILER or enable the C language.")
    endif()
    if(CMAKE_CXX_COMPILER)
        set(_conan_cpp_compiler "\"cpp\":\"${CMAKE_CXX_COMPILER}\"")
        set_conan_compiler_if_appleclang(CXX c++ _conan_cpp_compiler)
        list(APPEND _conan_compilers_list ${_conan_cpp_compiler})
    else()
        message(WARNING "CMake-Conan: The C++ compiler is not defined. "
                        "Please define CMAKE_CXX_COMPILER or enable the C++ language.")
    endif()
    if(CMAKE_RC_COMPILER)
        set(_conan_rc_compiler "\"rc\":\"${CMAKE_RC_COMPILER}\"")
        list(APPEND _conan_compilers_list ${_conan_rc_compiler})
        # Not necessary to warn if RC not defined
    endif()
    # The "x" prefix keeps the comparison well-formed when the list is empty.
    if(NOT "x${_conan_compilers_list}" STREQUAL "x")
        # Turn the CMake list (";"-separated) into a ","-separated body.
        string(REPLACE ";" "," _conan_compilers_list "${_conan_compilers_list}")
        string(APPEND profile "tools.build:compiler_executables={${_conan_compilers_list}}\n")
    endif()
    unset(_conan_c_compiler)
    unset(_conan_cpp_compiler)
    unset(_conan_rc_compiler)
    unset(_conan_compilers_list)
endmacro()


# Assemble a Conan host profile from the values CMake detected and write it to
# a file.
#
# output_file: path of the profile file to create.
#
# The generated text consists of a [settings] section with one line per
# detected (truthy) setting, followed by a [conf] section holding the CMake
# generator, the compiler executables and, for Android, the NDK path.
function(detect_host_profile output_file)
    # Each detect_* helper fills the named variables in this scope.
    detect_os(os os_api_level os_sdk os_subsystem os_version)
    detect_arch(arch)
    detect_compiler(compiler compiler_version compiler_runtime compiler_runtime_type)
    detect_cxx_standard(compiler_cppstd)
    detect_lib_cxx(compiler_libcxx)
    detect_build_type(build_type)

    set(profile "[settings]\n")

    # Conan setting names in output order. The local variable holding each
    # value is the setting name with "." replaced by "_"
    # (e.g. os.api_level -> os_api_level).
    foreach(_setting IN ITEMS
            arch
            os os.api_level os.version os.sdk os.subsystem
            compiler compiler.version compiler.runtime compiler.runtime_type
            compiler.cppstd compiler.libcxx)
        string(REPLACE "." "_" _setting_var "${_setting}")
        if(${_setting_var})
            string(APPEND profile ${_setting}=${${_setting_var}} "\n")
        endif()
    endforeach()
    if(build_type)
        string(APPEND profile "build_type=${build_type}\n")
    endif()

    if(DEFINED output_file)
        set(file_name ${output_file})
    else()
        set(file_name "${CMAKE_BINARY_DIR}/profile")
    endif()

    string(APPEND profile
        "[conf]\n"
        "tools.cmake.cmaketoolchain:generator=${CMAKE_GENERATOR}\n")

    # propagate compilers via profile (the macro appends to `profile`)
    append_compiler_executables_configuration()

    if(os STREQUAL "Android")
        string(APPEND profile "tools.android:ndk_path=${CMAKE_ANDROID_NDK}\n")
    endif()

    message(STATUS "CMake-Conan: Creating profile ${file_name}")
    file(WRITE ${file_name} ${profile})
    message(STATUS "CMake-Conan: Profile: \n${profile}")
endfunction()


# Make sure a Conan profile named "default" exists.
#
# Runs `conan profile path default`; when that exits with a non-zero status,
# runs `conan profile detect` to create the profile. The output of both
# commands is echoed. The exit status of `conan profile detect` is captured but
# not checked.
function(conan_profile_detect_default)
    message(STATUS "CMake-Conan: Checking if a default profile exists")
    execute_process(
        COMMAND ${CONAN_COMMAND} profile path default
        WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}
        RESULT_VARIABLE _profile_path_status
        OUTPUT_VARIABLE _conan_out
        ERROR_VARIABLE _conan_err
        ECHO_OUTPUT_VARIABLE    # show the text output regardless
        ECHO_ERROR_VARIABLE)
    if(${_profile_path_status} EQUAL "0")
        # The default profile is already there.
        return()
    endif()

    message(STATUS "CMake-Conan: The default profile doesn't exist, detecting it.")
    execute_process(
        COMMAND ${CONAN_COMMAND} profile detect
        WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}
        RESULT_VARIABLE _profile_detect_status
        OUTPUT_VARIABLE _conan_out
        ERROR_VARIABLE _conan_err
        ECHO_OUTPUT_VARIABLE    # show the text output regardless
        ECHO_ERROR_VARIABLE)
endfunction()


# Run `conan install` on the top-level source directory and publish the result.
#
# Arguments: everything passed in ARGN is forwarded to `conan install`
# (profiles, settings, generators, ...). The output folder is always
# ${CMAKE_BINARY_DIR}/conan and the JSON graph is requested with --format=json.
#
# On success this sets the global properties CONAN_GENERATORS_FOLDER and
# CONAN_INSTALL_SUCCESS, and registers the conanfile as a configure dependency
# of the top-level directory. A non-zero exit status is a FATAL_ERROR.
function(conan_install)
    # NOTE(review): this call does not follow the documented
    # cmake_parse_arguments(<prefix> <options> <one_value> <multi_value> ...)
    # signature and does not appear to populate `conan_args` - confirm before
    # removing or relying on it.
    cmake_parse_arguments(ARGS conan_args ${ARGN})
    set(conan_output_folder ${CMAKE_BINARY_DIR}/conan)
    # Invoke "conan install" with the provided arguments
    set(conan_args ${conan_args} -of=${conan_output_folder})
    message(STATUS "CMake-Conan: conan install ${CMAKE_SOURCE_DIR} ${conan_args} ${ARGN}")


    # In case there was not a valid cmake executable in the PATH, we inject the
    # same we used to invoke the provider to the PATH
    if(DEFINED PATH_TO_CMAKE_BIN)
        # Quoted so the saved value is restored exactly (an unquoted expansion
        # would be treated as a list and could drop empty elements).
        set(old_path "$ENV{PATH}")
        # PATH entries are separated by ";" on Windows hosts and ":" elsewhere;
        # using ":" on Windows would corrupt the last existing entry.
        if(CMAKE_HOST_WIN32)
            set(_path_list_separator ";")
        else()
            set(_path_list_separator ":")
        endif()
        set(ENV{PATH} "$ENV{PATH}${_path_list_separator}${PATH_TO_CMAKE_BIN}")
    endif()

    execute_process(COMMAND ${CONAN_COMMAND} install ${CMAKE_SOURCE_DIR} ${conan_args} ${ARGN} --format=json
                    RESULT_VARIABLE return_code
                    OUTPUT_VARIABLE conan_stdout
                    ERROR_VARIABLE conan_stderr
                    ECHO_ERROR_VARIABLE    # show the text output regardless
                    WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR})

    # Restore the environment before any error handling.
    if(DEFINED PATH_TO_CMAKE_BIN)
        set(ENV{PATH} "${old_path}")
    endif()

    if(NOT "${return_code}" STREQUAL "0")
        message(FATAL_ERROR "Conan install failed='${return_code}'")
    endif()

    # the files are generated in a folder that depends on the layout used, if
    # one is specified, but we don't know a priori where this is.
    # TODO: this can be made more robust if Conan can provide this in the json output
    string(JSON conan_generators_folder GET "${conan_stdout}" graph nodes 0 generators_folder)
    cmake_path(CONVERT ${conan_generators_folder} TO_CMAKE_PATH_LIST conan_generators_folder)

    message(STATUS "CMake-Conan: CONAN_GENERATORS_FOLDER=${conan_generators_folder}")
    set_property(GLOBAL PROPERTY CONAN_GENERATORS_FOLDER "${conan_generators_folder}")
    # reconfigure on conanfile changes
    string(JSON conanfile GET "${conan_stdout}" graph nodes 0 label)
    message(STATUS "CMake-Conan: CONANFILE=${CMAKE_SOURCE_DIR}/${conanfile}")
    set_property(DIRECTORY ${CMAKE_SOURCE_DIR} APPEND PROPERTY CMAKE_CONFIGURE_DEPENDS "${CMAKE_SOURCE_DIR}/${conanfile}")
    # success
    set_property(GLOBAL PROPERTY CONAN_INSTALL_SUCCESS TRUE)

endfunction()


# Query the version of a Conan executable.
#
# conan_command:         path or name of the Conan executable to run.
# conan_current_version: name of the variable, in the caller's scope, that
#                        receives the first "X.Y.Z" found in the output of
#                        `<conan_command> --version`.
#
# Raises a FATAL_ERROR when the command exits with a non-zero status.
function(conan_get_version conan_command conan_current_version)
    execute_process(
        COMMAND ${conan_command} --version
        OUTPUT_VARIABLE conan_output
        RESULT_VARIABLE conan_result
        OUTPUT_STRIP_TRAILING_WHITESPACE
    )
    if(conan_result)
        message(FATAL_ERROR "CMake-Conan: Error when trying to run Conan")
    endif()

    # The input is quoted so that empty output does not turn into a missing
    # argument (a hard string() usage error) and so that output containing
    # ";" is matched as one string instead of being split into list elements.
    string(REGEX MATCH "[0-9]+\\.[0-9]+\\.[0-9]+" conan_version "${conan_output}")
    set(${conan_current_version} ${conan_version} PARENT_SCOPE)
endfunction()


# Fail the configure step when the Conan version in use is too old.
#
# Keyword arguments (both required):
#   MINIMUM <version>  lowest acceptable Conan version.
#   CURRENT <version>  version that was detected.
#
# Raises a FATAL_ERROR when either keyword is missing, or when CURRENT compares
# as VERSION_LESS than MINIMUM.
function(conan_version_check)
    cmake_parse_arguments(_cvc "" "MINIMUM;CURRENT" "" ${ARGN})

    # Both keywords are mandatory; report the first one that is missing.
    foreach(_required_keyword IN ITEMS MINIMUM CURRENT)
        if(NOT _cvc_${_required_keyword})
            message(FATAL_ERROR "CMake-Conan: Required parameter ${_required_keyword} not set!")
        endif()
    endforeach()

    if(_cvc_CURRENT VERSION_LESS _cvc_MINIMUM)
        message(FATAL_ERROR "CMake-Conan: Conan version must be ${_cvc_MINIMUM} or later")
    endif()
endfunction()


# Turn a list of Conan profile names into `--profile:...=<name>` arguments.
#
# argument_variable: name of the variable that receives the resulting list.
# profile_list:      NAME of the variable holding the profiles; the name itself
#                    selects the flag: CONAN_HOST_PROFILE -> --profile:host=,
#                    CONAN_BUILD_PROFILE -> --profile:build=.
#
# This is a macro, so the result and the temporaries live in the caller's
# scope; the temporaries are unset before returning.
macro(construct_profile_argument argument_variable profile_list)
    set(${argument_variable} "")
    if("${profile_list}" STREQUAL "CONAN_HOST_PROFILE")
        set(_arg_flag "--profile:host=")
    elseif("${profile_list}" STREQUAL "CONAN_BUILD_PROFILE")
        set(_arg_flag "--profile:build=")
    endif()

    # Dereference the variable whose name was passed in.
    set(_profile_list "${${profile_list}}")
    # "auto-cmake" stands for the profile file generated in the build directory.
    list(TRANSFORM _profile_list REPLACE "auto-cmake" "${CMAKE_BINARY_DIR}/conan_host_profile")
    list(TRANSFORM _profile_list PREPEND ${_arg_flag})
    set(${argument_variable} ${_profile_list})

    unset(_arg_flag)
    unset(_profile_list)
endmacro()


# Dependency-provider entry point registered for find_package() requests.
#
# method:       provider method passed by CMake (not used in the body).
# package_name: name of the package being searched for.
# ARGN:         remaining find_package() arguments, forwarded to the
#               find_package() calls below.
#
# On the first invocation (global property CONAN_INSTALL_SUCCESS not set) this
# locates Conan, checks its version, prepares the profiles and runs
# `conan install`. On every invocation it then tries to find the package in the
# Conan generators folder first and falls back to the regular search.
#
# This is a macro, so it runs in the scope of the find_package() caller.
macro(conan_provide_dependency method package_name)
    # Record that the provider was used (checked by conan_provide_dependency_check).
    set_property(GLOBAL PROPERTY CONAN_PROVIDE_DEPENDENCY_INVOKED TRUE)
    get_property(_conan_install_success GLOBAL PROPERTY CONAN_INSTALL_SUCCESS)
    if(NOT _conan_install_success)
        find_program(CONAN_COMMAND "conan" REQUIRED)
        conan_get_version(${CONAN_COMMAND} CONAN_CURRENT_VERSION)
        conan_version_check(MINIMUM ${CONAN_MINIMUM_VERSION} CURRENT ${CONAN_CURRENT_VERSION})
        message(STATUS "CMake-Conan: first find_package() found. Installing dependencies with Conan")
        # Only probe/create the "default" profile when one of the lists uses it.
        if("default" IN_LIST CONAN_HOST_PROFILE OR "default" IN_LIST CONAN_BUILD_PROFILE)
            conan_profile_detect_default()
        endif()
        # "auto-cmake" requests a host profile generated from CMake's own detection.
        if("auto-cmake" IN_LIST CONAN_HOST_PROFILE)
            detect_host_profile(${CMAKE_BINARY_DIR}/conan_host_profile)
        endif()
        construct_profile_argument(_host_profile_flags CONAN_HOST_PROFILE)
        construct_profile_argument(_build_profile_flags CONAN_BUILD_PROFILE)
        # conanfile.py takes precedence over conanfile.txt. For conanfile.py no
        # generator is passed on the command line; for conanfile.txt
        # "-g CMakeDeps" is always added.
        if(EXISTS "${CMAKE_SOURCE_DIR}/conanfile.py")
            file(READ "${CMAKE_SOURCE_DIR}/conanfile.py" outfile)
            if(NOT "${outfile}" MATCHES ".*CMakeDeps.*")
                message(WARNING "Cmake-conan: CMakeDeps generator was not defined in the conanfile")
            endif()
            set(generator "")
        elseif (EXISTS "${CMAKE_SOURCE_DIR}/conanfile.txt")
            file(READ "${CMAKE_SOURCE_DIR}/conanfile.txt" outfile)
            if(NOT "${outfile}" MATCHES ".*CMakeDeps.*")
                message(WARNING "Cmake-conan: CMakeDeps generator was not defined in the conanfile. "
                        "Please define the generator as it will be mandatory in the future")
            endif()
            set(generator "-g;CMakeDeps")
        endif()
        get_property(_multiconfig_generator GLOBAL PROPERTY GENERATOR_IS_MULTI_CONFIG)
        if(NOT _multiconfig_generator)
            message(STATUS "CMake-Conan: Installing single configuration ${CMAKE_BUILD_TYPE}")
            conan_install(${_host_profile_flags} ${_build_profile_flags} ${CONAN_INSTALL_ARGS} ${generator})
        else()
            # Multi-config generators get one install per configuration.
            message(STATUS "CMake-Conan: Installing both Debug and Release")
            conan_install(${_host_profile_flags} ${_build_profile_flags} -s build_type=Release ${CONAN_INSTALL_ARGS} ${generator})
            conan_install(${_host_profile_flags} ${_build_profile_flags} -s build_type=Debug ${CONAN_INSTALL_ARGS} ${generator})
        endif()
        unset(_host_profile_flags)
        unset(_build_profile_flags)
        unset(_multiconfig_generator)
        unset(_conan_install_success)
    else()
        message(STATUS "CMake-Conan: find_package(${ARGV1}) found, 'conan install' already ran")
        unset(_conan_install_success)
    endif()

    get_property(_conan_generators_folder GLOBAL PROPERTY CONAN_GENERATORS_FOLDER)

    # Ensure that we consider Conan-provided packages ahead of any other,
    # irrespective of other settings that modify the search order or search paths
    # This follows the guidelines from the find_package documentation
    #  (https://cmake.org/cmake/help/latest/command/find_package.html):
    #       find_package (<PackageName> PATHS paths... NO_DEFAULT_PATH)
    #       find_package (<PackageName>)

    # Filter out `REQUIRED` from the argument list, as the first call may fail
    set(_find_args_${package_name} "${ARGN}")
    list(REMOVE_ITEM _find_args_${package_name} "REQUIRED")
    # NOTE(review): _find_args_<package> is only unset inside this branch, so it
    # stays defined in the caller's scope when MODULE is requested - confirm
    # whether that is intended.
    if(NOT "MODULE" IN_LIST _find_args_${package_name})
        find_package(${package_name} ${_find_args_${package_name}} BYPASS_PROVIDER PATHS "${_conan_generators_folder}" NO_DEFAULT_PATH NO_CMAKE_FIND_ROOT_PATH)
        unset(_find_args_${package_name})
    endif()

    # Invoke find_package a second time - if the first call succeeded,
    # this will simply reuse the result. If not, fall back to CMake default search
    # behaviour, also allowing modules to be searched.
    if(NOT ${package_name}_FOUND)
        # Temporarily put the generators folder at the front of CMAKE_MODULE_PATH.
        list(FIND CMAKE_MODULE_PATH "${_conan_generators_folder}" _index)
        if(_index EQUAL -1)
            list(PREPEND CMAKE_MODULE_PATH "${_conan_generators_folder}")
        endif()
        unset(_index)
        find_package(${package_name} ${ARGN} BYPASS_PROVIDER)
        # NOTE(review): the folder is removed even when it was already present
        # in CMAKE_MODULE_PATH before this call - confirm this is acceptable.
        list(REMOVE_ITEM CMAKE_MODULE_PATH "${_conan_generators_folder}")
    endif()
endmacro()


# Register conan_provide_dependency as the dependency provider; it is only
# consulted for find_package() requests.
cmake_language(
    SET_DEPENDENCY_PROVIDER conan_provide_dependency
    SUPPORTED_METHODS FIND_PACKAGE
)


# Warn when the dependency provider was registered but never invoked.
#
# Takes no arguments. Reads the global property
# CONAN_PROVIDE_DEPENDENCY_INVOKED (set by conan_provide_dependency) and emits
# a WARNING when it is not set. It is scheduled as a deferred call at the end
# of the top-level directory.
macro(conan_provide_dependency_check)
    # Default used when the property was never set.
    set(_conan_provide_dependency_invoked FALSE)
    get_property(_conan_provide_dependency_invoked GLOBAL PROPERTY CONAN_PROVIDE_DEPENDENCY_INVOKED)
    if(NOT _conan_provide_dependency_invoked)
        message(WARNING "Conan is correctly configured as dependency provider, "
                        "but Conan has not been invoked. Please add at least one "
                        "call to `find_package()`.")
        if(DEFINED CONAN_COMMAND)
            # suppress warning in case `CONAN_COMMAND` was specified but unused.
            # (reading the variable once counts as a use; the copy is discarded)
            set(_conan_command ${CONAN_COMMAND})
            unset(_conan_command)
        endif()
    endif()
    unset(_conan_provide_dependency_invoked)
endmacro()


# Add a deferred call at the end of processing the top-level directory
# to check if the dependency provider was invoked at all.
cmake_language(DEFER DIRECTORY "${CMAKE_SOURCE_DIR}" CALL conan_provide_dependency_check)

# Configurable variables for Conan profiles
# Each profile variable is a ";"-separated list. "default" is the Conan default
# profile; "auto-cmake" is replaced by the profile generated in the build
# directory (see construct_profile_argument).
set(CONAN_HOST_PROFILE "default;auto-cmake" CACHE STRING "Conan host profile")
set(CONAN_BUILD_PROFILE "default" CACHE STRING "Conan build profile")
set(CONAN_INSTALL_ARGS "--build=missing" CACHE STRING "Command line arguments for conan install")

# Check whether a `cmake` executable can be found with the CMake-specific search
# locations disabled. If not, remember the directory of the running CMake so
# that conan_install can add it to PATH.
find_program(_cmake_program NAMES cmake NO_PACKAGE_ROOT_PATH NO_CMAKE_PATH NO_CMAKE_ENVIRONMENT_PATH NO_CMAKE_SYSTEM_PATH NO_CMAKE_FIND_ROOT_PATH)
if(NOT _cmake_program)
    get_filename_component(PATH_TO_CMAKE_BIN "${CMAKE_COMMAND}" DIRECTORY)
    set(PATH_TO_CMAKE_BIN "${PATH_TO_CMAKE_BIN}" CACHE INTERNAL "Path where the CMake executable is")
endif()

# Restore the policy settings; the matching cmake_policy(PUSH) is presumably
# earlier in this file (not visible in this section).
cmake_policy(POP)


================================================
FILE: cmake/pod5_fuzz.cmake
================================================
# Fuzzing build configuration.
#
# Rejects compilers whose ID does not match "Clang" and then enables sanitizer
# and fuzzer instrumentation through directory-level compile and link options.
if (NOT CMAKE_CXX_COMPILER_ID MATCHES "Clang")
    message(FATAL_ERROR
        "Only LLVM based compilers are supported for fuzzing. Assuming that "
        "'clang' is installed, it can be picked by setting the environment "
        "variables 'CC=clang' and 'CXX=clang++' before invoking cmake."
    )
endif()

# Build everything with fuzzing instrumentation and sanitizers
# (address + undefined behaviour sanitizers, and fuzzer instrumentation
# without linking the fuzzer runtime into every target).
set(POD5_SANITIZER_FLAGS -fsanitize=address,undefined,fuzzer-no-link)
# -g: debug info for readable reports; -UNDEBUG: undefine NDEBUG;
# -O1: light optimisation.
add_compile_options(-g ${POD5_SANITIZER_FLAGS} -UNDEBUG -O1)
add_link_options(${POD5_SANITIZER_FLAGS})


================================================
FILE: cmake/pod5_packaging.cmake
================================================

# CPack configuration for the lib_pod5 package.
# These variables are set before include(CPack) below.
set(CPACK_PACKAGE_NAME "lib_pod5")
set(CPACK_PACKAGE_VENDOR "Oxford Nanopore")
set(CPACK_VERBATIM_VARIABLES true)
# Version components come from the POD5_VERSION_* variables, which are defined
# elsewhere in the project (not visible in this file).
set(CPACK_PACKAGE_VERSION_MAJOR ${POD5_VERSION_MAJOR})
set(CPACK_PACKAGE_VERSION_MINOR ${POD5_VERSION_MINOR})
set(CPACK_PACKAGE_VERSION_PATCH ${POD5_VERSION_REV})
set(CPACK_RESOURCE_FILE_LICENSE "${CMAKE_SOURCE_DIR}/LICENSE.md")

include(CPack)


================================================
FILE: cmake/presets/conan-build-options.json
================================================
{
    "version": 4,
    "configurePresets": [
        {
            "name": "conan2-debug",
            "binaryDir": "${sourceDir}/build",
            "hidden": true,
            "cacheVariables": {
                "CMAKE_BUILD_TYPE": "Debug"
            },
            "environment": {
                "CONAN_PROFILE_BUILD_TYPE": "Debug"
            }
        },
        {
            "name": "conan2-release",
            "binaryDir": "${sourceDir}/build",
            "hidden": true,
            "cacheVariables": {
                "CMAKE_BUILD_TYPE": "Release"
            },
            "environment": {
                "CONAN_PROFILE_BUILD_TYPE": "Release"
            }
        },
        {
            "name": "conan2-cppstd20",
            "hidden": true,
            "cacheVariables": {
                "CMAKE_CXX_STANDARD": "20"
            },
            "environment": {
                "CONAN_PROFILE_CPPSTD": "20"
            }
        },
        {
            "name": "conan2-cppstd17",
            "hidden": true,
            "cacheVariables": {
                "CMAKE_CXX_STANDARD": "17"
            },
            "environment": {
                "CONAN_PROFILE_CPPSTD": "17"
            }
        }
    ]
}


================================================
FILE: cmake/presets/conan-profiles.json
================================================
{
    "version": 4,
    "configurePresets": [
        {
            "name": "conan2-gcc9-x86_64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-x86_64-gcc9.jinja",
                "CONAN_BUILD_PROFILE": "linux-x86_64-gcc9.jinja"
            }
        },
        {
            "name": "conan2-gcc11-x86_64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-x86_64-gcc11.jinja",
                "CONAN_BUILD_PROFILE": "linux-x86_64-gcc11.jinja"
            }
        },
        {
            "name": "conan2-gcc11-asan-static-x86_64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-x86_64-gcc11-asan-static.jinja",
                "CONAN_BUILD_PROFILE": "linux-x86_64-gcc11-asan-static.jinja"
            }
        },
        {
            "name": "conan2-gcc11-usan-static-x86_64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-x86_64-gcc11-usan-static.jinja",
                "CONAN_BUILD_PROFILE": "linux-x86_64-gcc11-usan-static.jinja"
            }
        },
        {
            "name": "conan2-gcc11-tsan-static-x86_64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-x86_64-gcc11-tsan-static.jinja",
                "CONAN_BUILD_PROFILE": "linux-x86_64-gcc11-tsan-static.jinja"
            }
        },
        {
            "name": "conan2-gcc13-x86_64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-x86_64-gcc13.jinja",
                "CONAN_BUILD_PROFILE": "linux-x86_64-gcc13.jinja"
            }
        },
        {
            "name": "conan2-gcc13-aarch64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-aarch64-gcc13.jinja",
                "CONAN_BUILD_PROFILE": "linux-aarch64-gcc13.jinja"
            }
        },
        {
            "name": "conan2-gcc11-aarch64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-aarch64-gcc11.jinja",
                "CONAN_BUILD_PROFILE": "linux-aarch64-gcc11.jinja"
            }
        },
        {
            "name": "conan2-gcc9-aarch64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "linux-aarch64-gcc9.jinja",
                "CONAN_BUILD_PROFILE": "linux-aarch64-gcc9.jinja"
            }
        },
        {
            "name": "conan2-appleclang-15.0-aarch64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "macos-aarch64-appleclang-15.0.jinja",
                "CONAN_BUILD_PROFILE": "macos-aarch64-appleclang-15.0.jinja"
            }
        },
        {
            "name": "conan2-appleclang-16.0-aarch64-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "macos-aarch64-appleclang-16.0.jinja",
                "CONAN_BUILD_PROFILE": "macos-aarch64-appleclang-16.0.jinja"
            }
        },
        {
            "name": "conan2-windows-x86_64-vs2019-profile",
            "hidden": true,
            "cacheVariables": {
                "CONAN_HOST_PROFILE": "windows-x86_64-vs2019.jinja",
                "CONAN_BUILD_PROFILE": "windows-x86_64-vs2019.jinja"
            },
            "environment": {
                "CMAKE_GENERATOR": "Visual Studio 16 2019"
            }
        }
    ]
}


================================================
FILE: cmake/presets/conan-provider.json
================================================
{
    "version": 4,
    "configurePresets": [
        {
            "name": "conan2-provider",
            "hidden": true,
            "cacheVariables": {
                "CMAKE_PROJECT_TOP_LEVEL_INCLUDES": "${sourceDir}/cmake/conan_provider.cmake",
                "CONAN2": "ON",
                "CONAN_INSTALL_ARGS":
                    "--build=never;-o:a=arrow/*:with_boost=False;-o:a=arrow/*:with_thrift=False;-o:a=arrow/*:parquet=False;-o:a=arrow/*:with_zstd=True;"
            }
        }
    ]
}


================================================
FILE: conanfile.py
================================================
from conan import ConanFile
from conan.tools.cmake import CMakeToolchain, CMake, CMakeDeps
from conan.tools.files import collect_libs, copy
from conan.tools.build import cross_building
from conan.tools.cmake import cmake_layout
import os


class Pod5Conan(ConanFile):
    """Conan recipe that builds and packages the POD5 file format library."""

    name = "pod5_file_format"
    license = "MPL 2.0"
    url = "https://github.com/nanoporetech/pod5-file-format"
    description = "POD5 File format"
    topics = "nanopore", "sequencing", "genomic", "dna", "arrow"
    settings = "os", "compiler", "build_type", "arch"
    options = {"shared": [True, False]}
    default_options = {
        "shared": False,
    }
    exports_sources = [
        "c++/*",
        "cmake/*",
        "python/*",
        "third_party/*",
        "CMakeLists.txt",
        "LICENSE.md",
    ]

    def _setup_third_party_deps_packaging(self):
        """Copy the static libraries of bundled dependencies into the build tree.

        When building a static library, we need to pack arrow, zstd and, on
        Linux, jemalloc alongside the pod5 static lib to avoid linking errors.
        This function copies those libs to a folder called third_party in the
        build directory. The ci/install.sh ensures they end up in the correct
        location to be deployed, if install is done via cmake.
        """
        static_lib_pattern = "*.lib" if self.settings.os == "Windows" else "*.a"

        # Dependency name -> glob of the static libraries to copy. Each
        # dependency carries its own pattern so that a special case cannot
        # leak into the dependencies processed after it.
        lib_patterns = {
            "arrow": static_lib_pattern,
            "zstd": static_lib_pattern,
        }
        if self.settings.os == "Linux":
            # jemalloc is only packed on Linux, where only the *_pic archives
            # are copied.
            lib_patterns["jemalloc"] = "*_pic.a"

        for dep, pattern in lib_patterns.items():
            dep_object = self.dependencies[dep]
            copy(
                self,
                pattern,
                dep_object.cpp_info.libdir,
                f"{self.build_folder}/third_party/libs",
            )

    def _licenses_path(self):
        """Return the build-tree folder that collects dependency licenses."""
        # This needs to match the install step inside CMake.
        return os.path.join(self.build_folder, "pod5_conan_licenses")

    def _copy_licenses(self):
        """Copy each dependency's license files into ``_licenses_path()``.

        Files are matched case-insensitively against ``license*`` and stored
        in one sub-folder per dependency name.
        """
        for _require, dependency in self.dependencies.items():
            # package_folder will be None if this dependency isn't used.
            if dependency.package_folder is not None:
                copy(
                    self,
                    "license*",
                    dependency.package_folder,
                    os.path.join(self._licenses_path(), dependency.ref.name),
                    ignore_case=True,
                )

    def layout(self):
        """Use the standard CMake layout with the Ninja Multi-Config generator."""
        cmake_layout(self, "Ninja Multi-Config")

    def requirements(self):
        """Declare the libraries pod5 depends on.

        jemalloc is required on every OS except Windows, Macos and iOS.
        """
        self.requires("arrow/18.0.0")
        self.requires("flatbuffers/2.0.0")
        self.requires("zstd/[>=1.4.8 <=2.0.0]")
        self.requires("zlib/[>=1.2.11 <=2.0.0]")
        if not (
            self.settings.os == "Windows"
            or self.settings.os == "Macos"
            or self.settings.os == "iOS"
        ):
            self.requires("jemalloc/5.2.1")

    def build_requirements(self):
        """Declare build-time tools.

        When cross compiling we need a pre-compiled flatbuffers so that flatc
        can run on the build machine, which is not the target.
        The flatbuffers version is most likely available already; it is on the
        master branch and quite likely already built on the development branch.
        However, it seems that conan doesn't realise this, since it is the same
        package that it tries to build even though it is a different revision;
        flatbuffers, on the other hand, is downloaded.
        """
        if hasattr(self, "settings_build") and cross_building(self):
            # We are using an older version of flatbuffers not available on CCI.
            # @TODO: Update to a version that exists in CCI
            # When this line changes a corresponding change in .gitlab-ci.yml is required where this
            # package is uninstalled.
            self.tool_requires("flatbuffers/2.0.0")

    def generate(self):
        """Prepare the build tree: bundled libs, licenses, toolchain and deps files."""
        if not self.options.shared:
            # Static builds ship the third-party static libraries alongside pod5.
            self._setup_third_party_deps_packaging()

        self._copy_licenses()

        tc = CMakeToolchain(self)
        tc.variables["ENABLE_CONAN"] = "ON"
        tc.variables["BUILD_PYTHON_WHEEL"] = "OFF"
        tc.variables["POD5_DISABLE_TESTS"] = "ON"
        tc.variables["POD5_BUILD_EXAMPLES"] = "OFF"
        tc.variables["BUILD_SHARED_LIB"] = "ON" if self.options.shared else "OFF"

        tc.generate()

        deps = CMakeDeps(self)
        deps.check_components_exist = True

        # This ensures that target names in cmake would be in the form of libname::libname
        deps.set_property("zstd", "cmake_target_name", None)
        deps.generate()

    def build(self):
        """Configure and build the project with CMake."""
        cmake = CMake(self)
        cmake.configure()
        cmake.build()

    def package(self):
        """Install the CMake build and add licenses and bundled libraries."""
        cmake = CMake(self)
        cmake.install()

        # Copy the license files
        copy(
            self,
            "*",
            self._licenses_path(),
            os.path.join(self.package_folder, "licenses"),
        )

        # Package the required third party libs after installing pod5 static
        # NOTE(review): the destination is under build_folder, not
        # package_folder - confirm this is the intended location.
        if not self.options.shared:
            src = f"{self.build_folder}/third_party/libs/"
            dst = f"{self.build_folder}/lib/"
            copy(self, "*", src, dst)

    def package_info(self):
        """Describe the packaged libraries and their requirements to consumers."""
        # Note: package_info collects information in self.cpp_info. It is called from the Conan
        # application.
        #
        # This call is made immediately after the pre_package_info hook and before the
        # post_package_info hook. To get more information, we can "import traceback" and "import inspect",
        # then call traceback.print_stack() to print the complete call stack, or examine
        # inspect.stack().
        #
        # The caller has created self.cpp_info with the name set to the name of self, with a rootpath,
        # version and description from self, env_info and user_info set with default values,
        # public_deps set to an array with the names of public requirements in conanfile.requires.items.

        # Additions for this package. Note that everything in requirements needs to be mentioned
        # here. Except for Windows and Macos, jemalloc is also needed.

        self.cpp_info.libs = collect_libs(self)
        self.cpp_info.requires = [
            "arrow::arrow",
            "flatbuffers::flatbuffers",
            "zstd::zstd",
            "zlib::zlib",
        ]

        # Workaround for broken Arrow package - ensure transitive includes are available
        # Since our headers include Arrow headers, we need Arrow's includes to be transitively available
        try:
            arrow_dep = self.dependencies["arrow"]
            arrow_include_path = os.path.join(arrow_dep.package_folder, "include")
            if os.path.exists(arrow_include_path):
                self.cpp_info.includedirs.append(arrow_include_path)
        except Exception:
            # Best effort: if the Arrow dependency cannot be looked up here,
            # skip the extra include directory instead of failing.
            pass

        # NOTE(review): jemalloc is added here for Linux only, while
        # requirements() requires it on every OS except Windows/Macos/iOS -
        # confirm the two conditions are meant to differ.
        if self.settings.os == "Linux":
            self.cpp_info.requires.append("jemalloc::jemalloc")

        if self.settings.os in ["iOS", "Macos"]:
            self.cpp_info.frameworks = ["CoreFoundation"]


================================================
FILE: docs/DESIGN.md
================================================
POD5 File Format Design Details
==============================

## Summary

This file format has the following design goals (roughly in priority order):

- Good write performance for MinKNOW
- Recoverable if the writing process crashes
- Good read performance for downstream tools, including basecall model generation
- Efficient use of space
- Straightforward to implement and maintain
- Extensibility

Note that trade-offs have been made between these goals, but we have mostly aimed to leave those trade-offs as run-time decisions.

We have also chosen not to optimise for editing existing files.


### Write performance

The aspects of this format that are designed to maximise write performance are:

- Data can be written sequentially
  - The sequential access pattern makes it easy to use efficient operating system APIs (such as io_uring on Linux)
  - The sequential access pattern helps the operating system's I/O scheduler maximise throughput
- Signal data from different reads can be interleaved, and data streams can be safely abandoned (at the cost of using more space than necessary)
  - This allows MinKNOW to write out data as it arrives, potentially avoiding the need to have an intermediate caching format (this file format can be used for the cache and the final output)
- Support for space- and CPU-efficient compression routines (VBZ)
  - This reduces the amount of data that needs to be written, which reduces I/O load

### Recovery

The aspects of this format that are designed to allow for recovery if the writing process crashes are:

- A way to indicate that a file is actually complete as intended (complete files end with a recognisable footer)
- The Apache Feather format can be assembled by reading it sequentially, without using the footer
- The data file format is append-only, which means that once data is recorded it cannot be corrupted by later updates

### Read performance

The aspects of this format that are designed to maximise read performance are:

- The Apache Feather format can be memory mapped and used directly
- Apache Arrow has significant existing engineering work geared around efficient access to data, from the layout of the data itself to the library tooling
- Storing direct information about signal data locations with the row table
  - This allows quick access to a read's data without scanning the data file
- It is possible to only decode part of a long read, due to read data being stored in chunks
  - This is useful for model training
- Read access does not require locking or otherwise modifying the file
  - This allows multi-threaded and multi-process access to a file for reading

### Efficient use of space

The aspects of this format that are designed to make efficient use of space are:

- Support for efficient compression routines (VBZ)
- Apache Arrow's support for dictionary encoding
- Apache Arrow's support for compressing buffers with standard compression routines

### Ease of implementation

The aspects of this format that are designed to make the format easy to implement are:

- Relying on an existing, widely-used format (Apache Arrow)

### Extensibility

The aspects of this format that are designed to make the format extensible are:

- Apache Arrow uses a self-describing schema with named columns, so it is straightforward to write code that is resilient in the face of things like additional columns being added.


================================================
FILE: docs/README.md
================================================
Design documentation for POD5
============================

The POD5 file format has been specifically designed to be suitable for Nanopore read data. We had some specific design goals:

Design Goals
------------

The primary purpose of this file format is to store reads produced by Oxford Nanopore sequencing, and in particular the signal data from those reads (which can then be basecalled or processed in other ways).

This file format has the following design goals:

- Good write performance for MinKNOW
- Recoverable if the writing process crashes
- Good read performance for downstream tools, including basecall model generation
- Efficient use of space
- Straightforward to implement and maintain
- Extensibility

Note that trade-offs have been made between these goals, but we have mostly aimed to make those run-time decisions.

We have also chosen not to optimise for editing existing files.

More detailed information around general format goals can be found in [DESIGN](./DESIGN.md); a more detailed format specification is available in [SPECIFICATION](./SPECIFICATION.md).


================================================
FILE: docs/SPECIFICATION.md
================================================
POD5 Format Specification
=========================

## Overview

The file format is, at its core, a collection of Apache Arrow tables, stored in the Apache Feather 2
(also known as Apache Arrow IPC File) format, and bundled into a container format. The container file
has the extension `.pod5`.

### Table Schemas

POD5 files are a custom wrapper format around arrow that contain several [arrow
tables](https://arrow.apache.org/docs/python/data.html#tables).

All the tables should have the following `custom_metadata` fields set on them:

| Name                    | Example Value                        | Notes                                                                                                                                       |
|-------------------------|--------------------------------------|---------------------------------------------------------------------------------------------------------------------------------------------|
| MINKNOW:pod5_version    | 1.0.0                                | The version of this specification that the schema was based on.                                                                             |
| MINKNOW:software        | MinKNOW Core 5.2.3                   | A free-form description of the software that wrote the file, intended to help pin down the source of files that violate the specification.  |
| MINKNOW:file_identifier | cbf91180-0684-4a39-bf56-41eaf437de9e | Must be identical across all tables. Allows checking that the files correspond to each other.                                               |

### Extension Types

Several fields in the table schemas use [custom arrow
types](https://arrow.apache.org/docs/python/data.html#custom-schema-and-field-metadata).

#### minknow.uuid

The schemas make extensive use of UUIDs to identify reads. This is stored using an extension type,
with the following properties:

    Name: "minknow.uuid"
    Physical storage: FixedBinary(16)

#### minknow.vbz

Storage for VBZ-encoded data:

    Name: "minknow.vbz"
    Physical storage: LargeBinary

### Tables

The Reads, Signal and Run Info tables must all be present in a POD5 file. Note that some very early
POD5 files produced by pre-0.1 versions of the pod5 library did not include a Run Info table,
instead including that information in the Reads table.

#### Reads Table

The Reads table contains a single row per read, and describes the metadata for each read. The
`signal` column of the read links to the Signal table, and allows a read's signal to be retrieved.
The `run_info` column links to the Run Info table, providing more context for the read and
avoiding duplicating data that is common to many or all reads in the file.

Some fields of the Reads table are
[dictionaries](https://arrow.apache.org/docs/python/data.html#dictionary-arrays): the contents of
the table are stored in a lookup written prior to each batch of read rows and the read row itself
then contains an integer index. This allows space savings on fields that would otherwise be
repeated. Only simple types are stored in dictionaries as third party tools have limited support for
dictionaries of structs.

[tables/reads.toml](./tables/reads.toml) contains specific information about fields in the reads table.

#### Signal Table

The signal table contains the (optionally compressed) signal data, where each row contains a
sequence of sample data and some information about the origin of that sample data.

[tables/signal.toml](./tables/signal.toml) contains specific information about fields in the signal table.

#### Run Info Table

The run info table contains a single row per MinKNOW run that any read in the file came from.

Several fields of the Reads table are
[dictionaries](https://arrow.apache.org/docs/python/data.html#dictionary-arrays), the contents of
the table are stored in a lookup written prior to each batch of read rows, the read row itself then
contains an integer index. This allows space savings on fields that would otherwise be repeated.

[tables/run_info.toml](./tables/run_info.toml) contains specific information about fields in the run info table.

### Combined file Layout

#### Layout

```
<signature "\213POD\r\n\032\n">
<section marker: 16 bytes>
<embedded file 1 (padded to 8-byte boundary)><section marker: 16 bytes>
...
<embedded file N (padded to 8-byte boundary)><section marker: 16 bytes>
<footer magic: "FOOTER\000\000">
<footer (padded to 8-byte boundary)>
<footer length: 8 bytes little-endian signed integer>
<section marker: 16 bytes>
<signature "\213POD\r\n\032\n">
```

All padding bytes should be zero. They ensure memory mapped files have the alignment that Arrow
expects.

#### Signature

The first and last eight bytes of the file are both a fixed set of values:

```
| Decimal          | 139  | 80   | 79   | 68   | 13   | 10   | 26   | 10   |
| Hexadecimal      | 0x8B | 0x50 | 0x4F | 0x44 | 0x0D | 0x0A | 0x1A | 0x0A |
| ASCII C Notation | \213 | P    | O    | D    | \r   | \n   | \032 | \n   |
```

The format of the signature is based on the PNG file signature, and inherits several useful features
from it for detecting file corruption:

- The first byte is non-ASCII to reduce the probability it is interpreted as a text file.
- The first byte has the high bit set to catch file transfers that clear the top bit.
- The \r\n (CRLF) sequence and the final \n (LF) byte check that nothing has attempted to
  standardise line endings in the file.
- The second-last byte (\032) is the CTRL-Z sequence, which stops file display under MS-DOS.

##### Rationale

A unique, fixed signature for the file type allows quickly identifying that the file is in the
expected format, and provides an easy way for tools like the UNIX `file` command to determine the
file type.

Placing it at the end allows quickly checking whether the file is complete.


#### Section marker

The section marker is a 16-byte UUID, generated randomly for each file. All the section markers in a
given file must be identical.

##### Rationale

This aids in recovery of partially-written files (that are missing a footer) - while most of the
embedded Arrow IPC files can be scanned easily, it may not be obvious where the footer ends. A given
randomly-generated 16-byte value is highly unlikely to occur in actual data, and can be scanned for
to find the end of the embedded file for certain. The first section marker is just so that recovery
tools know what to look for.

#### Footer magic

This is the ASCII string "FOOTER" padded to 8 bytes with zeroes. It helps find a partially-written
footer when recovering files.

#### Footer

The footer is an encoded [FlatBuffer](https://google.github.io/flatbuffers/) table, using the schema
below.

```fbs
namespace Minknow.ReadsFormat;

enum ContentType:short {
    // The Reads table (an Arrow table)
    ReadsTable,
    // The Signal table (an Arrow table)
    SignalTable,
    // An index for looking up data in the ReadsTable by read_id
    ReadIdIndex,
    // An index based on other columns and/or tables (it will need to be opened to find out what it indexes)
    OtherIndex,
}

enum Format:short {
    // The Apache Feather V2 format, also known as the Apache Arrow IPC File format.
    FeatherV2,
}

// Describes an embedded file.
table EmbeddedFile {
    // The start of the embedded file
    offset: int64;
    // The length of the embedded file (excluding any padding)
    length: int64;
    // The format of the file
    format: Format;
    // What contents should be expected in the file
    content_type: ContentType;
}

table Footer {
    // Must match the "MINKNOW:file_identifier" custom metadata entry in the schemas of the bundled tables.
    file_identifier: string;
    // A free-form description of the software that wrote the file, intended to help pin down the source of files that violate the specification.
    software: string;
    // The version of this specification that the table schemas are based on (1.0.0).
    pod5_version: string;
    // The Apache Arrow tables stored in the file.
    contents: [ EmbeddedFile ];
}
```

##### Rationale

FlatBuffers are used because the Arrow IPC file format already uses them for metadata, and they can
be read from a memory mapped file or read buffer without further copying. They are also easily (and
compatibly) extensible with more fields.

A footer is used instead of a header so the file can be written incrementally: the first table can
be written directly to the file before it is known how long it will be or even how many tables there
will be.

#### Footer length

This is a little-endian 8-byte signed integer giving the length of the footer buffer, including
padding.

##### Rationale

This allows readers to find the start of the footer by starting at the end of the file and reading
backwards.


================================================
FILE: docs/tables/reads.toml
================================================
[fields.read_id]
type = "minknow.uuid"
description = "Globally-unique identifier for the read, can be converted to a string form (using standard routines in other libraries) which matches how reads are identified elsewhere."

[fields.signal]
type = "list(uint64)"
description = "A list of zero-indexed row numbers in the Signal table. This must be all the rows in the Signal table that have a matching read_id, in order. It functions as an index for the Signal table."

[fields.channel]
type = "uint16"
description = "1-indexed channel"

[fields.well]
type = "uint8"
description = "1-indexed well (typically 1, 2, 3 or 4)"

[fields.pore_type]
type = "dictionary(string)"
description = "Name of the pore type present in the well"

[fields.calibration_offset]
type = "float"
description = "Calibration offset used to scale raw ADC data into pA readings."

[fields.calibration_scale]
type = "float"
description = "Calibration scale factor used to scale raw ADC data into pA readings."

[fields.read_number]
type = "uint32"
description = "The read number on channel. This is increasing, but not necessarily consecutive."

[fields.start]
type = "uint64"
description = "How many samples were taken on this channel before the read started (since the data acquisition period began). This can be combined with the sample rate to get a time in seconds for the start of the read relative to the start of data acquisition."

[fields.median_before]
type = "float"
description = "The level of current in the well before this read (typically the open pore level of the well). If the level is not known (eg: due to a mux change), this should be nulled out."

# Deprecated: will be removed in 0.4.0
[fields.tracked_scaling_scale]
type = "float"
description = "Scale for tracked read scaling values (based on previous reads shift)"

# Deprecated: will be removed in 0.4.0
[fields.tracked_scaling_shift]
type = "float"
description = "Shift for tracked read scaling values (based on previous reads shift)"

# Deprecated: will be removed in 0.4.0
[fields.predicted_scaling_scale]
type = "float"
description = "Scale for predicted read scaling values (based on this read's raw signal)"

# Deprecated: will be removed in 0.4.0
[fields.predicted_scaling_shift]
type = "float"
description = "Shift for predicted read scaling values (based on this read's raw signal)"

# Deprecated: will be removed in 0.4.0
[fields.num_reads_since_mux_change]
type = "uint32"
description = "Number of selected reads since the last mux change on this read's channel"

# Deprecated: will be removed in 0.4.0
[fields.time_since_mux_change]
type = "float"
description = "Time in seconds since the last mux change on this read's channel"

[fields.num_minknow_events]
type = "uint64"
description = "Number of minknow events that the read contains"

[fields.end_reason]
type = "dictionary(string)"
description = "The end reason, currently one of: unknown, mux_change, unblock_mux_change, data_service_unblock_mux_change, signal_positive, signal_negative, api_request, device_data_error, analysis_config_change or paused."

[fields.end_reason_forced]
type = "bool"
description = "True if this read was ended 'forcibly' (eg: mux_change, unblock), false if it was a data-driven read break (signal_positive, signal_negative). This allows simple categorisation even in the presence of new reasons that reading code is unaware of."

[fields.run_info]
type = "dictionary(utf8)"
description = "The run (acquisition) this read came from. Must match the acquisition_id field of exactly one entry in the run_info table."

[fields.num_samples]
type = "uint64"
description = "The full length of the signal for this read in samples (equal to the sum of all 'samples' fields of signal chunks)"

[fields.open_pore_level]
type = "float"
description = "The open pore level for the read. A value in pA showing the open pore level of the well prior to the read starting. If the information is not available (feature not enabled in MinKNOW, or sequencing run on an old version) this value will be NaN."


================================================
FILE: docs/tables/run_info.toml
================================================
[fields.acquisition_id]
type = "utf8"
description = "A unique identifier for the run (acquisition). This is the same identifier that MinKNOW uses to identify an acquisition within a protocol."

[fields.acquisition_start_time]
type = "timestamp(milliseconds)"
description = "This is the clock time for sample 0, and can be used together with sample_rate and the :start read field to calculate a clock time for when a given read was acquired. The timezone should be set. MinKNOW will set this to the local timezone on file creation. When merging files that have different timezones, merging code will have to pick a timezone (possibly defaulting to 'UTC')."

[fields.adc_max]
type = "int16"
description = "The maximum ADC value that might be encountered. This is a hardware constraint."

[fields.adc_min]
type = "int16"
description = "The minimum ADC value that might be encountered. This is a hardware constraint. adc_max - adc_min + 1 is the digitisation."

[fields.context_tags]
type = "map(utf8, utf8)"
description = "The context tags for the run. For compatibility with fast5. Readers must not make any assumptions about the contents of this field."

[fields.experiment_name]
type = "utf8"
description = "A user-supplied name for the experiment being run."

[fields.flow_cell_id]
type = "utf8"
description = "Uniquely identifies the flow cell the data was captured on. This is written on the flow cell case."

[fields.flow_cell_product_code]
type = "utf8"
description = "Identifies the type of flow cell the data was captured on."

[fields.protocol_name]
type = "utf8"
description = "The name of the protocol that was run."

[fields.protocol_run_id]
type = "utf8"
description = "A unique identifier for the protocol run that produced this data."

[fields.protocol_start_time]
type = "timestamp(milliseconds)"
description = "When the protocol that the acquisition was part of started. The same considerations apply as for acquisition_start_time."

[fields.sample_id]
type = "utf8"
description = "A user-supplied name for the sample being analysed."

[fields.sample_rate]
type = "uint16"
description = "The number of samples acquired each second on each channel. This can be used to convert numbers of samples into time durations."

[fields.sequencing_kit]
type = "utf8"
description = "The type of sequencing kit used to prepare the sample."

[fields.sequencer_position]
type = "utf8"
description = "The sequencer position the data was collected on. For removable positions, like MinION Mk1Bs, this is unique (e.g. 'MN12345'), while for integrated positions it is not (e.g. 'X1' on a GridION)."

[fields.sequencer_position_type]
type = "utf8"
description = "The type of sequencing hardware the data was collected on. For example: 'MinION Mk1B' or 'GridION' or 'PromethION'."

[fields.software]
type = "utf8"
description = "A description of the software that acquired the data. For example: 'MinKNOW 21.05.12 (Bream 5.1.6, Configurations 16.2.1, Core 5.1.9, Guppy 4.2.3)'."

[fields.system_name]
type = "utf8"
description = "The name of the system the data was collected on. This might be a sequencer serial (eg: 'GXB1234') or a host name (e.g. 'Lab PC')."

[fields.system_type]
type = "utf8"
description = "The type of system the data was collected on. For example, 'GridION Mk1' or 'PromethION P48'. If the system is not a Nanopore sequencer with built-in compute, this will be a description of the operating system (e.g. 'Ubuntu 20.04')."

[fields.tracking_id]
type = "map(utf8, utf8)"
description = "The tracking id for the run. For compatibility with fast5. Readers must not make any assumptions about the contents of this field."


================================================
FILE: docs/tables/signal.toml
================================================
[fields.read_id]
type = "minknow.uuid"
description = "Globally-unique identifier for the read the data came from. This aids recovery and consistency checking."

[fields.signal]
type = [ "large_list(int16)", "minknow.vbz" ]
description = "The actual signal. The encoding of the data must be the same for all reads in the file, and is determined by the choice of logical type. LargeList(Int16) is the uncompressed storage option. Readers that do not recognise the logical type of this column will be unable to decode the signal data."

[fields.samples]
type = "uint32"
description = "The number of samples stored in this row. Allows skipping over compressed chunks easily, also necessary for decoding StreamVByte-encoded data."


================================================
FILE: fuzz/.gitattributes
================================================
# Store all corpora in LFS
*.zip filter=lfs diff=lfs merge=lfs -text


================================================
FILE: fuzz/CMakeLists.txt
================================================
# Cache option forwarded to each fuzzer test as its -max_total_time argument.
set(FUZZER_RUN_TIME 0 CACHE STRING "How long to run each fuzzer for. 0 indicates no limit")

# The fuzzer only uses nproc/2 workers, so limit the number of jobs to that.
# The result is passed to each fuzzer test as its -jobs argument.
include(ProcessorCount)
ProcessorCount(NUM_FUZZER_JOBS)
math(EXPR NUM_FUZZER_JOBS "${NUM_FUZZER_JOBS} / 2")

# Make sure that all issues get picked up
# Each entry is applied to the tests through the ENVIRONMENT_MODIFICATION test property, so it is
# written as VAR=OP:VALUE; with the string_append operation the value (starting at the second ':')
# is appended to whatever the variable already holds.
set(FUZZ_SANITIZER_OPTIONS
    # Note that we have to disable |detect_leaks| since arrow will allocate persistent state.
    "ASAN_OPTIONS=string_append::detect_stack_use_after_return=1:check_initialization_order=1:detect_leaks=0"
    "UBSAN_OPTIONS=string_append::print_stacktrace=1:halt_on_error=1"
)

# make_fuzzer(<type>)
#
# Registers the targets and tests for the fuzz harness in fuzz_<type>.cpp:
#   * fuzzer_<type>      - the libFuzzer binary and its test (only when ENABLE_FUZZERS is set)
#   * fuzz_runner_<type> - a plain executable (harness + runner.cpp) and a test that runs it over
#                          the corpus, for builds without fuzzing
# The corpus archive corpus_<type>.zip is unpacked into corpus_<type>/ in the source directory.
function(make_fuzzer TYPE)
    # Unpack the corpus next to its archive.
    set(corpus_dir ${CMAKE_CURRENT_SOURCE_DIR}/corpus_${TYPE})
    file(ARCHIVE_EXTRACT INPUT ${corpus_dir}.zip DESTINATION ${corpus_dir})

    if (ENABLE_FUZZERS)
        # The real fuzzer, linked against the libFuzzer runtime.
        set(fuzzer_target fuzzer_${TYPE})
        add_executable(${fuzzer_target} fuzz_${TYPE}.cpp)
        target_link_libraries(${fuzzer_target} PUBLIC pod5_format)
        target_link_options(${fuzzer_target} PUBLIC -fsanitize=fuzzer)
        target_compile_definitions(${fuzzer_target}
            PRIVATE BUILD_SHARED_LIB=$<BOOL:${BUILD_SHARED_LIB}>
        )

        # Register it as a test. It runs from the source directory so that failing cases are
        # dumped there.
        add_test(
            NAME ${fuzzer_target}
            COMMAND ${fuzzer_target} -jobs=${NUM_FUZZER_JOBS} -max_total_time=${FUZZER_RUN_TIME} -timeout=100 ${corpus_dir}
            WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}
        )
        set_tests_properties(${fuzzer_target}
            PROPERTIES ENVIRONMENT_MODIFICATION "${FUZZ_SANITIZER_OPTIONS}"
        )
    endif()

    # Corpus runner for non-fuzzing builds: the same harness source plus runner.cpp.
    set(runner_target fuzz_runner_${TYPE})
    add_executable(${runner_target}
        fuzz_${TYPE}.cpp
        runner.cpp
    )
    target_link_libraries(${runner_target} PRIVATE pod5_format)
    # The runner relies on std::filesystem.
    target_compile_features(${runner_target} PRIVATE cxx_std_17)
    # Keep assert() active even in Release builds.
    target_compile_options(${runner_target} PRIVATE -UNDEBUG)
    target_compile_definitions(${runner_target}
        PRIVATE BUILD_SHARED_LIB=$<BOOL:${BUILD_SHARED_LIB}>
    )
    add_test(
        NAME ${runner_target}
        COMMAND ${runner_target} ${corpus_dir}
    )
    set_tests_properties(${runner_target}
        PROPERTIES ENVIRONMENT_MODIFICATION "${FUZZ_SANITIZER_OPTIONS}"
    )
endfunction()

# One harness per fuzz_<type>.cpp source: signal compression and file reading.
make_fuzzer(compress)
make_fuzzer(file)


================================================
FILE: fuzz/fuzz_compress.cpp
================================================
#include <pod5_format/c_api.h>

#include <cassert>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <vector>

#ifndef _WIN32
#include <unistd.h>
#else
#include <process.h>

// Windows stand-in for setenv(), forwarding to _putenv_s(). The third (overwrite) argument is
// accepted for signature compatibility but ignored.
static int setenv(char const * name, char const * value, int) { return _putenv_s(name, value); }
#endif

// No access to arrow in shared lib builds.
#if !BUILD_SHARED_LIB
#include <arrow/memory_pool.h>
#endif

#ifdef NDEBUG
#error "asserts aren't enabled"
#endif

namespace {
// Abort (via assert) unless a POD5 call succeeded and the value it returned agrees with the
// library's own error state.
//   err - value returned by the POD5 call
//   msg - text identifying the call, used in the diagnostic output
void CheckPod5(pod5_error_t err, char const * msg)
{
    // The call itself must have succeeded.
    bool const call_succeeded = (err == POD5_OK);
    if (!call_succeeded) {
        printf("Assertion failed: %s - %i - %s\n", msg, err, pod5_get_error_string());
        assert(false);
    }

    // The returned code must match what pod5_get_error_no() reports.
    bool const matches_error_no = (err == pod5_get_error_no());
    if (!matches_error_no) {
        printf("POD5 inconsistency: %s - %i != %i\n", msg, err, pod5_get_error_no());
        assert(false);
    }
}

// Evaluate a POD5 call and check it, using the call's source text as the message.
#define CHECK_POD5(x) CheckPod5(x, #x)
}  // namespace

// One-time fuzzer setup: select arrow's system allocator through the environment, then
// initialise the POD5 library. Always returns 0.
extern "C" int LLVMFuzzerInitialize(int * argc, char *** argv)
{
    // The command line is not needed by this harness.
    (void)argc;
    (void)argv;

    // Ask arrow to use the system allocator.
    char const * const pool_variable = "ARROW_DEFAULT_MEMORY_POOL";
    char const * const pool_backend = "system";
    setenv(pool_variable, pool_backend, 1);
#if !BUILD_SHARED_LIB
    // NOTE(review): this inspects system_memory_pool() rather than the default pool - confirm that
    // is the intended check.
    assert(arrow::system_memory_pool()->backend_name() == "system");
#endif

    // Bring up the POD5 library.
    CHECK_POD5(pod5_init());
    return 0;
}

// Fuzz entry point for the VBZ signal codec.
//
// The input bytes are used twice: first as int16 samples that are compressed and decompressed,
// asserting that the round trip reproduces them exactly; then as a raw "compressed" buffer handed
// straight to the decompressor. Always returns 0.
extern "C" int LLVMFuzzerTestOneInput(uint8_t const * data, size_t size)
{
    // POD5 requires non-empty input
    // (anything shorter than one int16 sample would give an empty sample vector below).
    if (size < sizeof(int16_t)) {
        return 0;
    }

    // Copy to a new buffer of the "right" type so that we get bounds checking even if the length wasn't even
    // (a trailing odd byte is dropped by the integer division).
    std::vector<int16_t> input(size / sizeof(int16_t));
    std::memcpy(input.data(), data, input.size() * sizeof(int16_t));

    // Compress it
    // The output buffer is sized to the library's reported upper bound; compressed_size is passed
    // in holding the buffer size and is expected to hold the number of bytes used on return.
    size_t const max_compressed_size = pod5_vbz_compressed_signal_max_size(input.size());
    std::vector<char> compressed_data(max_compressed_size);
    size_t compressed_size = compressed_data.size();
    CHECK_POD5(pod5_vbz_compress_signal(
        input.data(), input.size(), compressed_data.data(), &compressed_size));
    assert(compressed_size <= max_compressed_size);

    // Update size for bounds checking when decompressing
    // (a fresh vector holding exactly the bytes that were produced).
    compressed_data =
        std::vector<char>(compressed_data.begin(), compressed_data.begin() + compressed_size);

    // Decompress it
    std::vector<int16_t> output(input.size());
    CHECK_POD5(pod5_vbz_decompress_signal(
        compressed_data.data(), compressed_data.size(), output.size(), output.data()));

    // Check it decompressed correctly
    assert(input == output);

    // See how it handles random input
    // The result is not checked here - presumably because arbitrary bytes are allowed to fail to
    // decode, and only crashes or sanitizer reports are of interest.
    std::vector<int16_t> temp(pod5_vbz_compressed_signal_max_size(size));
    pod5_vbz_decompress_signal(
        reinterpret_cast<char const *>(data), size, temp.size(), temp.data());

    return 0;
}


================================================
FILE: fuzz/fuzz_file.cpp
================================================
#include <pod5_format/c_api.h>

#include <algorithm>
#include <array>
#include <cassert>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <memory>
#include <random>
#include <string>
#include <vector>

#ifndef _WIN32
#include <unistd.h>
#else
#include <process.h>

// Windows stand-in for setenv(), forwarding to _putenv_s(). The third (overwrite) argument is
// accepted for signature compatibility but ignored.
static int setenv(char const * name, char const * value, int) { return _putenv_s(name, value); }
#endif

// No access to arrow in shared lib builds.
#if !BUILD_SHARED_LIB
#include <arrow/memory_pool.h>
#endif

#ifdef NDEBUG
#error "asserts aren't enabled"
#endif

namespace {
// Global state
std::string s_file_name;

// Write out data to the temp file (s_file_name), replacing any previous contents.
//
//   data - bytes to write
//   size - number of bytes in data
// Returns the path of the file that was written.
//
// The file is opened in binary mode: the input is arbitrary bytes, and a text-mode stream on
// Windows would translate line endings, so the reader would not see the bytes the fuzzer produced.
// Any I/O failure aborts via assert rather than silently testing a truncated or stale file.
char const * write_data(void const * data, size_t size)
{
    FILE * f = fopen(s_file_name.c_str(), "wb");
    assert(f != nullptr);

    size_t const written = fwrite(data, 1, size, f);
    assert(written == size);

    // fclose() flushes buffered data, so a failure here also means the file may be incomplete.
    int const close_result = fclose(f);
    assert(close_result == 0);

    return s_file_name.c_str();
}

// Abort (via assert) with a diagnostic unless a POD5 call returned POD5_OK.
//   err - value returned by the call
//   msg - text identifying the call
void check_pod5_ok(pod5_error_t err, char const * msg)
{
    if (err == POD5_OK) {
        return;
    }

    printf("Assertion failed: %s - %i - %s\n", msg, err, pod5_get_error_string());
    assert(false);
}

// Abort (via assert) with a diagnostic if a function's return value disagrees with
// pod5_get_error_no().
//   err - value returned by the call
//   msg - text identifying the call
void check_pod5_consistency(pod5_error_t err, char const * msg)
{
    if (err == pod5_get_error_no()) {
        return;
    }

    printf("POD5 inconsistency: %s - %i != %i\n", msg, err, pod5_get_error_no());
    assert(false);
}

// For calls that must succeed: evaluates func exactly once, then requires both that the result
// is POD5_OK and that it matches pod5_get_error_no(). The call's source text is the message.
#define CHECK_POD5_SUCCESS(func)             \
    do {                                     \
        auto _res = func;                    \
        check_pod5_ok(_res, #func);          \
        check_pod5_consistency(_res, #func); \
    } while (false)

// For calls that are allowed to fail: only requires that the result matches pod5_get_error_no().
#define CHECK_POD5_MAY_FAIL(func) check_pod5_consistency(func, #func)

// Copies the argument into a volatile local so that the optimiser cannot discard the work that
// produced it.
template <typename T>
void keep_result(T && t)
{
    auto volatile sink = t;
    static_cast<void>(sink);
}

// Make sure that a string is NUL-terminated by copying it into a std::string, which reads every
// byte up to the terminator, and keeping the copy alive past the optimiser.
void validate_string(char const * ptr)
{
    std::string copied(ptr);
    keep_result(copied);
}

// Deleter for POD5 reader handles: closes and frees a non-null reader, and requires the close
// itself to succeed.
struct POD5FileCloser {
    void operator()(Pod5FileReader_t * file)
    {
        if (file == nullptr) {
            return;
        }
        CHECK_POD5_SUCCESS(pod5_close_and_free_reader(file));
    }
};

// Owning handle for an open POD5 reader.
using POD5File = std::unique_ptr<Pod5FileReader_t, POD5FileCloser>;
}  // namespace

// One-time fuzzer setup: select arrow's system allocator through the environment, initialise the
// POD5 library and choose the per-process temporary file name. Always returns 0.
extern "C" int LLVMFuzzerInitialize(int * argc, char *** argv)
{
    // The command line is not needed by this harness.
    (void)argc;
    (void)argv;

    // Ask arrow to use the system allocator.
    char const * const pool_variable = "ARROW_DEFAULT_MEMORY_POOL";
    char const * const pool_backend = "system";
    setenv(pool_variable, pool_backend, 1);
#if !BUILD_SHARED_LIB
    // NOTE(review): this inspects system_memory_pool() rather than the default pool - confirm that
    // is the intended check.
    assert(arrow::system_memory_pool()->backend_name() == "system");
#endif

    // Bring up the POD5 library.
    CHECK_POD5_SUCCESS(pod5_init());

    // Every run in this process reuses one scratch file, named after the process ID.
    s_file_name = "./fuzz_tmp_";
    s_file_name += std::to_string(getpid());
    return 0;
}

// Fuzz entry point: treat `data` as the bytes of a POD5 file and exercise the
// C API reader against it.
//
// The input is written to the temp file and opened; if it does not open, the
// run ends there. Otherwise the file is walked batch by batch and row by row.
// Calls that are expected to succeed on any file that opened are wrapped in
// CHECK_POD5_SUCCESS; calls that may fail are wrapped in CHECK_POD5_MAY_FAIL,
// which only checks that the reported error state is consistent.
// Always returns 0.
extern "C" int LLVMFuzzerTestOneInput(uint8_t const * data, size_t size)
{
    // Write the input to a file
    char const * file_path = write_data(data, size);

    // Try and open it
    POD5File file(pod5_open_file(file_path));
    if (file == nullptr) {
        return 0;
    }

    // Check that we can query info about the file.
    FileInfo_t file_info{};
    CHECK_POD5_SUCCESS(pod5_get_file_info(file.get(), &file_info));

    // If we need any more randomness, use the file's ID as a seed.
    // Seeding from the input keeps every run reproducible for a given file.
    std::seed_seq seed(std::begin(file_info.file_identifier), std::end(file_info.file_identifier));
    std::mt19937_64 rng(seed);

    // See what IDs there are
    std::size_t batch_count = 0;
    CHECK_POD5_SUCCESS(pod5_get_read_batch_count(&batch_count, file.get()));

    std::size_t total_read_count = 0;
    for (std::size_t batch_index = 0; batch_index < batch_count; ++batch_index) {
        Pod5ReadRecordBatch_t * batch = nullptr;
        CHECK_POD5_MAY_FAIL(pod5_get_read_batch(&batch, file.get(), batch_index));
        if (batch == nullptr) {
            continue;
        }

        std::size_t batch_row_count = 0;
        CHECK_POD5_SUCCESS(pod5_get_read_batch_row_count(&batch_row_count, batch));
        total_read_count += batch_row_count;

        for (std::size_t row = 0; row < batch_row_count; ++row) {
            uint16_t read_table_version = 0;
            ReadBatchRowInfo_t read_data;
            CHECK_POD5_SUCCESS(pod5_get_read_batch_row_info_data(
                batch, row, READ_BATCH_ROW_INFO_VERSION, &read_data, &read_table_version));

            // Check read formatter.
            std::array<char, 37> formatted_read_id;
            CHECK_POD5_SUCCESS(pod5_format_read_id(read_data.read_id, formatted_read_id.data()));
            validate_string(formatted_read_id.data());

            // Check signal indices.
            // The upper bound caps the allocation made for a single row.
            assert(read_data.signal_row_count >= 0);
            if (read_data.signal_row_count > 0 && read_data.signal_row_count < 1'000'000) {
                std::vector<uint64_t> indices(read_data.signal_row_count);
                CHECK_POD5_SUCCESS(
                    pod5_get_signal_row_indices(batch, row, indices.size(), indices.data()));
            }

            // Check signal extraction.
            // sample_count stays 0 if the count query fails, so the signal
            // query is then made with an empty buffer.
            std::size_t sample_count = 0;
            CHECK_POD5_MAY_FAIL(
                pod5_get_read_complete_sample_count(file.get(), batch, row, &sample_count));
            if (sample_count < 1'000'000) {
                std::vector<int16_t> samples(sample_count);
                CHECK_POD5_MAY_FAIL(pod5_get_read_complete_signal(
                    file.get(), batch, row, samples.size(), samples.data()));
            }

            // Check calibration data.
            CalibrationExtraData_t calib_data;
            CHECK_POD5_MAY_FAIL(pod5_get_calibration_extra_info(batch, row, &calib_data));

            // Check run info.
            RunInfoDictData_t * run_info = nullptr;
            CHECK_POD5_MAY_FAIL(pod5_get_run_info(batch, read_data.run_info, &run_info));
            // We'll do a proper check of the run info later.
            if (run_info != nullptr) {
                CHECK_POD5_SUCCESS(pod5_free_run_info(run_info));
            }
        }

        // Check run info.
        run_info_index_t run_info_count = 0;
        CHECK_POD5_MAY_FAIL(pod5_get_file_run_info_count(file.get(), &run_info_count));
        for (run_info_index_t run_info_idx = 0; run_info_idx < run_info_count; run_info_idx++) {
            RunInfoDictData_t * run_info_data = nullptr;
            CHECK_POD5_SUCCESS(pod5_get_file_run_info(file.get(), run_info_idx, &run_info_data));
            assert(run_info_data != nullptr);

            validate_string(run_info_data->acquisition_id);
            validate_string(run_info_data->experiment_name);
            validate_string(run_info_data->flow_cell_id);
            validate_string(run_info_data->flow_cell_product_code);
            validate_string(run_info_data->protocol_name);
            validate_string(run_info_data->protocol_run_id);
            validate_string(run_info_data->sample_id);
            validate_string(run_info_data->sequencing_kit);
            validate_string(run_info_data->sequencer_position);
            validate_string(run_info_data->sequencer_position_type);
            validate_string(run_info_data->software);
            validate_string(run_info_data->system_name);
            validate_string(run_info_data->system_type);
            for (std::size_t i = 0; i < run_info_data->context_tags.size; i++) {
                validate_string(run_info_data->context_tags.keys[i]);
                validate_string(run_info_data->context_tags.values[i]);
            }
            for (std::size_t i = 0; i < run_info_data->tracking_id.size; i++) {
                validate_string(run_info_data->tracking_id.keys[i]);
                validate_string(run_info_data->tracking_id.values[i]);
            }

            CHECK_POD5_SUCCESS(pod5_free_run_info(run_info_data));
        }

        // Cleanup.
        CHECK_POD5_SUCCESS(pod5_free_read_batch(batch));
    }

    {
        // Check total read count matches.
        std::size_t read_count = 0;
        CHECK_POD5_MAY_FAIL(pod5_get_read_count(file.get(), &read_count));
        if (pod5_get_error_no() == POD5_OK) {
            assert(read_count == total_read_count);
        } else {
            read_count = 0;
        }

        if (read_count > 0) {
            // Query all the reads IDs.
            std::size_t const id_size = sizeof(read_id_t);
            std::vector<uint8_t> read_ids(read_count * id_size);
            CHECK_POD5_SUCCESS(pod5_get_read_ids(
                file.get(), read_count, reinterpret_cast<read_id_t *>(read_ids.data())));

            // Randomise the order of the read IDs and then try and plan a path through them.
            // The shuffle is applied to a permutation of whole-ID indices: shuffling the raw
            // byte buffer would scramble the IDs themselves instead of reordering them.
            std::vector<std::size_t> order(read_count);
            for (std::size_t i = 0; i < read_count; ++i) {
                order[i] = i;
            }
            std::shuffle(order.begin(), order.end(), rng);

            std::vector<uint8_t> shuffled_ids(read_ids.size());
            for (std::size_t i = 0; i < read_count; ++i) {
                std::copy_n(
                    read_ids.data() + order[i] * id_size,
                    id_size,
                    shuffled_ids.data() + i * id_size);
            }

            // NOTE(review): pod5_plan_traversal appears to write one count per read-table
            // batch, so the buffer must hold at least batch_count entries - confirm against
            // the C API documentation. It is never made smaller than read_count.
            std::vector<std::uint32_t> batch_counts(std::max(batch_count, read_count));
            std::vector<std::uint32_t> batch_rows(read_count);
            std::size_t find_success_count = 0;
            CHECK_POD5_MAY_FAIL(pod5_plan_traversal(
                file.get(),
                shuffled_ids.data(),
                read_count,
                batch_counts.data(),
                batch_rows.data(),
                &find_success_count));
            assert(find_success_count <= read_count);
        }
    }

    // Check embedded files.
    {
        for (auto * pod5_get_embedded_file : {
                 pod5_get_file_read_table_location,
                 pod5_get_file_signal_table_location,
                 pod5_get_file_run_info_table_location,
             })
        {
            EmbeddedFileData_t file_data{};
            CHECK_POD5_SUCCESS(pod5_get_embedded_file(file.get(), &file_data));
            validate_string(file_data.file_name);
            // Each embedded table must lie entirely within the input. The second check is
            // written as a subtraction so that offset + length cannot wrap around.
            assert(file_data.offset <= size);
            assert(file_data.length <= size - file_data.offset);
        }
    }

    return 0;
}


================================================
FILE: fuzz/runner.cpp
================================================
#include <cassert>
#include <cstdlib>
#include <filesystem>
#include <fstream>
#include <iostream>
#include <string_view>
#include <vector>

#ifdef NDEBUG
#error "asserts aren't enabled"
#endif

extern "C" {
int LLVMFuzzerInitialize(int * argc, char *** argv);
int LLVMFuzzerTestOneInput(uint8_t const * data, size_t size);
}

namespace {

// Load one corpus file into memory and pass its bytes to the fuzz target.
// When `verbose` is set, the path is printed before the file is run.
void run_one(bool verbose, std::filesystem::path const & path)
{
    if (verbose) {
        std::cout << "Running " << path.string() << std::endl;
    }

    // Size the buffer from the file's size on disk, then fill it with one read.
    auto const byte_count = std::filesystem::file_size(path);
    std::vector<uint8_t> contents(byte_count);
    std::ifstream input(path, std::ios::in | std::ios::binary);
    input.read(reinterpret_cast<char *>(contents.data()), contents.size());
    // The stream tests false if the open failed or the read came up short.
    assert(input);

    // The fuzz target's return value is not inspected.
    LLVMFuzzerTestOneInput(contents.data(), contents.size());
}

// Run every regular file found beneath `path`, descending into subdirectories.
// Entries that are neither directories nor regular files are skipped.
void run_recursive(bool verbose, std::filesystem::path const & path)
{
    for (auto const & entry : std::filesystem::directory_iterator(path)) {
        if (std::filesystem::is_directory(entry)) {
            run_recursive(verbose, entry.path());
            continue;
        }

        if (std::filesystem::is_regular_file(entry)) {
            run_one(verbose, entry.path());
        }
    }
}

}  // namespace

// Replay corpus files through the fuzz target without a fuzzing engine.
//
// Usage: <program> [-v] <corpus>
//   -v        print the path of each file before it is run
//   <corpus>  a single input file, or a directory that is searched recursively
//
// Returns EXIT_SUCCESS once every input has been run, or EXIT_FAILURE for bad
// arguments or a corpus path that is neither a directory nor a regular file.
int main(int argc, char ** argv)
{
    // Parse args.
    char const * corpus = nullptr;
    bool verbose = false;
    if (argc == 3 && std::string_view(argv[1]) == "-v") {
        // Only the documented "-v" flag enables verbose mode; any other first
        // argument now produces the usage message instead of being silently
        // treated as "-v".
        verbose = true;
        corpus = argv[2];
    } else if (argc == 2) {
        corpus = argv[1];
    } else {
        // argv[0] is not guaranteed to be set, so fall back to a fixed name.
        char const * program = (argc > 0 && argv[0] != nullptr) ? argv[0] : "runner";
        std::cerr << "Usage: " << program << " [-v] <corpus>" << std::endl;
        return EXIT_FAILURE;
    }

    // Setup.
    LLVMFuzzerInitialize(&argc, &argv);

    // Run it.
    std::filesystem::path corpus_path(corpus);
    if (std::filesystem::is_directory(corpus_path)) {
        std::cout << "Running all corpus files" << std::endl;
        run_recursive(verbose, corpus_path);
    } else if (std::filesystem::is_regular_file(corpus_path)) {
        std::cout << "Running single file" << std::endl;
        run_one(verbose, corpus_path);
    } else {
        std::cerr << "Unknown file type: " << corpus << std::endl;
        return EXIT_FAILURE;
    }

    // Reaching this point means no assertion fired for any input.
    std::cout << "Success!" << std::endl;
    return EXIT_SUCCESS;
}


================================================
FILE: pod5_make_version.py
================================================
"""
Write the POD5Version.cmake file by inspecting the _version.py file created by
setuptools_scm
"""

from pathlib import Path
from _version import __version__, __version_tuple__


def create_pod5_version_cmake():
    """Generate ``cmake/POD5Version.cmake`` next to this script.

    The major, minor and revision numbers are the first three entries of the
    setuptools_scm ``__version_tuple__``; the full version is ``__version__``.
    """
    cmake_path = Path(__file__).parent / "cmake/POD5Version.cmake"
    with cmake_path.open("w") as _fh:
        major = __version_tuple__[0]
        minor = __version_tuple__[1]
        rev = __version_tuple__[2]
        cmake_lines = (
            "# Created by pod5_make_version.py \n",
            f"set(POD5_VERSION_MAJOR {major} )\n",
            f"set(POD5_VERSION_MINOR {minor} )\n",
            f"set(POD5_VERSION_REV {rev} )\n",
            f"set(POD5_NUMERIC_VERSION {major}.{minor}.{rev} )\n",
            f"set(POD5_FULL_VERSION {__version__} ) \n",
        )
        _fh.write("".join(cmake_lines))


def copy_version_py():
    """Replace the ``_version.py`` files of lib_pod5 and pod5 with the generated one.

    The source is ``_version.py`` in the current working directory; the two
    destinations are resolved relative to the directory containing this script.
    """
    source = Path("_version.py")
    assert source.exists()

    script_dir = Path(__file__).parent
    destinations = (
        script_dir / "python/lib_pod5/src/lib_pod5/_version.py",
        script_dir / "python/pod5/src/pod5/_version.py",
    )

    # Remove any existing copies first, then write both fresh copies.
    for destination in destinations:
        if destination.exists():
            destination.unlink()

    for destination in destinations:
        destination.write_bytes(source.read_bytes())


# Script entry point: write the CMake version file first, then refresh the
# per-package copies of _version.py.
if __name__ == "__main__":
    print(f"Writing POD5Version.cmake with version: {__version__}")
    create_pod5_version_cmake()

    print("Copying _version.py into lib_pod5 and pod5 source directories")
    copy_version_py()


================================================
FILE: pyproject.toml
================================================
# This project file is used to generate the version information written to _version.py
# To create this file, simply pip install the root pod5-file-format directory

[build-system]
requires = ["setuptools >= 61.0", "wheel", "setuptools_scm[toml]>=6.2"]
build-backend = "setuptools.build_meta"

[project]
name = "pod5version"
requires-python = ">= 3.9, < 4.0"
dynamic = ["version"]
description="Oxford Nanopore Technologies Pod5 File Format VCS Versioning"

[tool.setuptools.packages.find]
# Ignore all files
exclude = ["*"]

[tool.setuptools_scm]
root = "."
write_to = "_version.py"


================================================
FILE: pytest.ini
================================================
[pytest]
minversion = 6.0

addopts =
    # Report details on all non-passing tests
    -ra
    --verbose
    --color=yes

# Warnings are errors
filterwarnings =
    error
    ignore::DeprecationWarning

# Find tests in both python projects
testpaths =
    python/lib_pod5/
    python/pod5/


================================================
FILE: python/.gitignore
================================================
__pycache__/
*.egg-info/
*.whl
*.so
.DS_Store
licenses/


================================================
FILE: python/lib_pod5/Makefile
================================================
SHELL = /bin/bash
# Interpreter used to create the virtual environment; override on the command
# line with `make PYTHON=...`. pyproject.toml requires Python >= 3.9, so the
# default must not pin an older minor version.
PYTHON ?= python3

envDir = venv
envPrompt ?= "lib-pod5"

# None of these targets produce a file of the same name (`venv` in particular
# shares its name with the environment directory), so always run them.
.PHONY: clean venv update install wheel

# Clean the python virtual environment
clean:
	rm -rf ${envDir}

# Create a python virtual environment
venv:
	${PYTHON} -m venv ${envDir} --prompt=${envPrompt}

# install the python project in the current venv
update:
	source ${envDir}/bin/activate \
	&& pip install --upgrade pip \
	&& pip install -e .[dev]

# Completely re-install the python environment for development
install: clean venv update
	@echo "To activate your new environment:  source ${envDir}/bin/activate"

# Build the wheel
wheel: update
	source ${envDir}/bin/activate \
	&& python -m build


================================================
FILE: python/lib_pod5/README.md
================================================
LIB_POD5 Package
================

POD5 is a file format for storing nanopore DNA data in an easily accessible way.

What does this project contain
------------------------------

This project contains the low-level core library (extension modules) for reading and
writing POD5 files. This project forms the basis of the pure-python `pod5` package which
is probably the project you want.


================================================
FILE: python/lib_pod5/pyproject.toml
================================================
[build-system]
requires = ["setuptools >= 61.0", "wheel", "pybind11~=2.10.0"]
build-backend = "setuptools.build_meta"


[project]
name = "lib_pod5"
authors = [{name="Oxford Nanopore Technologies plc", email="support@nanoporetech.com"}]
readme="README.md"
requires-python=">= 3.9, < 4.0"
description="Python bindings for the POD5 file format"
dynamic = ["version"]
keywords = ['nanopore']
classifiers=[
    'Environment :: Console',
    'Intended Audience :: Developers',
    'Intended Audience :: Science/Research',
    'Natural Language :: English',
    'Programming Language :: Python :: 3',
    'Topic :: Scientific/Engineering :: Bio-Informatics',
]
dependencies = ["numpy>=1.21.0"]
license="MPL-2.0"
license-files = ["licenses/**/*"]


[project.optional-dependencies]
dev = [
    "build",
    "pytest ~= 7.3",
]

[project.urls]
Homepage = "https://github.com/nanoporetech/pod5-file-format"
Issues = "https://github.com/nanoporetech/pod5-file-format/issues"
Documentation = "https://pod5-file-format.readthedocs.io/en/latest/"

[tool.setuptools.dynamic]
version = {attr = "lib_pod5._version.__version__"}

[tool.setuptools.packages.find]
where = ["src"]
exclude = ["test"]

[tool.setuptools.package-data]
"lib_pod5" = ["*"]

[tool.black]
# Keep in step with the minimum interpreter declared in requires-python (3.9).
target-version = ["py39"]


================================================
FILE: python/lib_pod5/setup.py
================================================
"""
lib_pod5 setup.py
Proprietary and confidential information of Oxford Nanopore Technologies plc
All rights reserved; (c)2022: Oxford Nanopore Technologies plc

This script can either install a development version of pod5 to the current
Python environment, or create a Python wheel.

Note that this is *not* intended to be run from within the "pod5" folder of
the pod5_file_format repository, because the libraries are
not actually installed there. See INSTALL.md for further details.

"""

import os
import sys

import setuptools

# Extra keyword arguments passed to setuptools.setup(); only populated when a
# wheel is being built.
extra_setup_args = {}

if "bdist_wheel" in sys.argv:
    # We need to convince distutils to put lib-pod5 in a platform-dependent
    # location (as opposed to a "universal" one) or auditwheel will complain
    # later. This is a hack to get it to do that.
    # See https://github.com/pypa/auditwheel/pull/28#issuecomment-212082647
    import platform
    from distutils.command.install import install

    from wheel.bdist_wheel import bdist_wheel

    # Install command that overrides install_lib once the base class has been
    # initialised.
    class BinaryInstall(install):
        def __init__(self, dist):
            super().__init__(dist)
            # We should be able to set install_lib = self.install_platlib
            # but that doesn't appear to work on OSX or Linux, so we have to do this.
            if platform.system() != "Windows":
                self.install_lib = ""
            else:
                self.install_lib = self.install_platlib

    # Wheel command that marks the wheel as not pure-Python and allows the
    # platform tag to be overridden from the environment.
    class BdistWheel(bdist_wheel):
        def finalize_options(self):
            bdist_wheel.finalize_options(self)
            # Mark the wheel root as platform-specific rather than pure.
            self.root_is_pure = False

        def get_tag(self):
            # Start from the tag computed by the base class and replace only
            # the platform part when FORCE_PYTHON_PLATFORM is set.
            python, abi, plat = bdist_wheel.get_tag(self)
            if "FORCE_PYTHON_PLATFORM" in os.environ:
                plat = os.environ["FORCE_PYTHON_PLATFORM"]
            return python, abi, plat

    extra_setup_args["cmdclass"] = {"install": BinaryInstall, "bdist_wheel": BdistWheel}


# Remaining project metadata is not passed here (presumably it is read from
# pyproject.toml - confirm).
if __name__ == "__main__":
    setuptools.setup(
        # Always report extension modules (presumably so the distribution is
        # treated as platform-specific - confirm).
        has_ext_modules=lambda: True,
        **extra_setup_args,
    )


================================================
FILE: python/lib_pod5/src/lib_pod5/__init__.py
================================================
"""Imports everything from the pod5_format_pybind module and associated .pyi"""

from ._version import __version__, __version_tuple__
from .pod5_format_pybind import (
    EmbeddedFileData,
    FileWriter,
    FileWriterOptions,
    Pod5AsyncSignalLoader,
    Pod5FileReader,
    Pod5RepackerOutput,
    Pod5SignalCacheBatch,
    RecoverFileOptions,
    RecoveredRowCounts,
    Repacker,
    SignalType,
    compress_signal,
    create_file,
    recover_file,
    decompress_signal,
    format_read_id_to_str,
    get_error_string,
    load_read_id_iterable,
    open_file,
    update_file,
    subset_pod5s_with_mapping,
    vbz_compressed_signal_max_size,
)

__all__ = [
    "__version__",
    "__version_tuple__",
    "EmbeddedFileData",
    "FileWriter",
    "FileWriterOptions",
    "Pod5AsyncSignalLoader",
    "Pod5FileReader",
    "Pod5RepackerOutput",
    "Pod5SignalCacheBatch",
    "RecoverFileOptions",
    "RecoveredRowCounts",
    "Repacker",
    "SignalType",
    "compress_signal",
    "create_file",
    "recover_file",
    "decompress_signal",
    "format_read_id_to_str",
    "get_error_string",
    "load_read_id_iterable",
    "open_file",
    "update_file",
    "subset_pod5s_with_mapping",
    "vbz_compressed_signal_max_size",
]


================================================
FILE: python/lib_pod5/src/lib_pod5/pod5_format_pybind.pyi
================================================
"""
c++ bindings for pod5_format
"""

# pylint: skip-file

# created with mypy.stubgen for code completion
# > pip install mypy
# > stubgen -m lib_pod5.pod5_format_pybind

from typing import Any, Iterable, List, Optional, Tuple, Union

import numpy as np
import numpy.typing as npt

class CleanupError:
    description: str
    file_path: str
    def __init__(self) -> None: ...

class EmbeddedFileData:
    def __init__(self, *args, **kwargs) -> None: ...
    @property
    def length(self) -> int: ...
    @property
    def offset(self) -> int: ...
    @property
    def file_path(self) -> str: ...

class FileWriter:
    def __init__(self, *args, **kwargs) -> None: ...
    def add_end_reason(self, end_reason_enum: int) -> int: ...
    def add_pore(self, pore_type: str) -> int: ...
    def add_reads(
        self,
        count: int,
        read_ids: npt.NDArray[np.uint8],
        read_numbers: npt.NDArray[np.uint32],
        start_samples: npt.NDArray[np.uint64],
        channels: npt.NDArray[np.uint16],
        wells: npt.NDArray[np.uint8],
        pore_types: npt.NDArray[np.int16],
        calibration_offsets: npt.NDArray[np.float32],
        calibration_scales: npt.NDArray[np.float32],
        median_befores: npt.NDArray[np.float32],
        end_reasons: npt.NDArray[np.int16],
        end_reason_forceds: npt.NDArray[np.bool_],
        run_infos: npt.NDArray[np.int16],
        num_minknow_events: npt.NDArray[np.uint64],
        tracked_scaling_scales: npt.NDArray[np.float32],
        tracked_scaling_shifts: npt.NDArray[np.float32],
        predicted_scaling_scales: npt.NDArray[np.float32],
        predicted_scaling_shifts: npt.NDArray[np.float32],
        num_reads_since_mux_changes: npt.NDArray[np.uint32],
        time_since_mux_changes: npt.NDArray[np.float32],
        open_pore_levels: npt.NDArray[np.float32],
        signals: List[npt.NDArray[np.int16]],
    ) -> None: ...
    def add_reads_pre_compressed(
        self,
        count: int,
        read_ids: npt.NDArray[np.uint8],
        read_numbers: npt.NDArray[np.uint32],
        start_samples: npt.NDArray[np.uint64],
        channels: npt.NDArray[np.uint16],
        wells: npt.NDArray[np.uint8],
        pore_types: npt.NDArray[np.int16],
        calibration_offsets: npt.NDArray[np.float32],
        calibration_scales: npt.NDArray[np.float32],
        median_befores: npt.NDArray[np.float32],
        end_reasons: npt.NDArray[np.int16],
        end_reason_forceds: npt.NDArray[np.bool_],
        run_infos: npt.NDArray[np.int16],
        num_minknow_events: npt.NDArray[np.uint64],
        tracked_scaling_scales: npt.NDArray[np.float32],
        tracked_scaling_shifts: npt.NDArray[np.float32],
        predicted_scaling_scales: npt.NDArray[np.float32],
        predicted_scaling_shifts: npt.NDArray[np.float32],
        num_reads_since_mux_changes: npt.NDArray[np.uint32],
        time_since_mux_changes: npt.NDArray[np.float32],
        open_pore_levels: npt.NDArray[np.float32],
        signal_chunks: List[npt.NDArray[np.uint8]],
        signal_chunk_lengths: npt.NDArray[np.uint32],
        signal_chunk_counts: npt.NDArray[np.uint32],
    ) -> None: ...
    def add_run_info(
        self,
        acquisition_id: str,
        acquisition_start_time: int,
        adc_max: int,
        adc_min: int,
        context_tags: List[Tuple[str, str]],
        experiment_name: str,
        flow_cell_id: str,
        flow_cell_product_code: str,
        protocol_name: str,
        protocol_run_id: str,
        protocol_start_time: int,
        sample_id: str,
        sample_rate: int,
        sequencing_kit: str,
        sequencer_position: str,
        sequencer_position_type: str,
        software: str,
        system_name: str,
        system_type: str,
        tracking_id: List[Tuple[str, str]],
    ) -> int: ...
    def close(self) -> None: ...

class FileWriterOptions:
    max_signal_chunk_size: int
    read_table_batch_size: int
    signal_compression_type: Any
    signal_table_batch_size: int
    def __init__(self, *args, **kwargs) -> None: ...

class Pod5AsyncSignalLoader:
    def __init__(self, *args, **kwargs) -> None: ...
    def release_next_batch(self) -> Pod5SignalCacheBatch: ...

class Pod5FileReader:
    def __init__(self, *args, **kwargs) -> None: ...
    def batch_get_signal(
        self, get_samples: bool, get_sample_count: bool
    ) -> Pod5AsyncSignalLoader: ...
    def batch_get_signal_batches(
        self,
        get_samples: bool,
        get_samples_count: bool,
        batches: npt.NDArray[np.uint32],
    ) -> Pod5AsyncSignalLoader: ...
    def batch_get_signal_selection(
        self,
        get_samples: bool,
        get_sample_count: bool,
        batch_counts: npt.NDArray[np.uint32],
        batch_rows: npt.NDArray[np.uint32],
    ) -> Pod5AsyncSignalLoader: ...
    def close(self) -> None: ...
    def get_file_read_table_location(self) -> EmbeddedFileData: ...
    def get_file_run_info_table_location(self) -> EmbeddedFileData: ...
    def get_file_signal_table_location(self) -> EmbeddedFileData: ...
    def get_file_version_pre_migration(self) -> str: ...
    def plan_traversal(
        self,
        read_id_data: npt.NDArray[np.uint8],
        batch_counts: npt.NDArray[np.uint32],
        batch_rows: npt.NDArray[np.uint32],
    ) -> int: ...

class Pod5RepackerOutput:
    def __init__(self, *args, **kwargs) -> None: ...

class Pod5SignalCacheBatch:
    def __init__(self, *args, **kwargs) -> None: ...
    @property
    def batch_index(self) -> int: ...
    @property
    def sample_count(self) -> npt.NDArray[np.uint64]: ...
    @property
    def samples(self) -> List[npt.NDArray[np.int16]]: ...

class RecoverFileOptions:
    cleanup: bool
    file_writer_options: FileWriterOptions
    def __init__(self) -> None: ...

class RecoveredRowCounts:
    reads: int
    run_info: int
    signal: int
    def __init__(self) -> None: ...

class RecoveryDetails:
    cleanup_errors: list[CleanupError]
    row_counts: RecoveredRowCounts
    def __init__(self) -> None: ...

class Repacker:
    def __init__(self) -> None: ...
    def add_all_reads_to_output(
        self, output: Pod5RepackerOutput, input: Pod5FileReader
    ) -> None: ...
    def add_output(
        self, output: FileWriter, check_duplicate_read_ids: bool
    ) -> Pod5RepackerOutput: ...
    def add_selected_reads_to_output(
        self,
        output: Pod5RepackerOutput,
        input: Pod5FileReader,
        batch_counts: npt.NDArray[np.uint32],
        all_batch_rows: npt.NDArray[np.uint32],
    ) -> None: ...
    def finish(self) -> None: ...
    @property
    def is_complete(self) -> bool: ...
    @property
    def open_file_readers(self) -> int: ...
    @property
    def reads_completed(self) -> int: ...

def compress_signal(
    signal: npt.NDArray[np.int16], compressed_signal_out: npt.NDArray[np.uint8]
) -> int: ...
def create_file(
    src_filename: str, writer_name: str, options: Optional[FileWriterOptions]
) -> FileWriter: ...
def recover_file(
    src_filename: str, dest_filename: str, options: Optional[RecoverFileOptions]
) -> RecoveryDetails: ...
def decompress_signal(
    compressed_signal: Union[npt.NDArray[np.uint8], memoryview],
    signal_out: npt.NDArray[np.int16],
) -> None: ...
def format_read_id_to_str(
    read_id_data_out: npt.NDArray[np.uint8],
) -> List[str]: ...
def get_error_string() -> str: ...
def load_read_id_iterable(
    read_ids_str: Iterable, read_id_data_out: npt.NDArray[np.uint8]
) -> int: ...
def open_file(filename: str) -> Pod5FileReader: ...
def update_file(reader: Pod5FileReader, output: str): ...
def vbz_compressed_signal_max_size(sample_count: int) -> int: ...

# NOTE(review): lib_pod5/__init__.py imports this name from the extension module
# but no stub was declared for it. The signature is left fully permissive until
# it has been confirmed against the pybind11 bindings.
def subset_pod5s_with_mapping(*args: Any, **kwargs: Any) -> Any: ...


================================================
FILE: python/lib_pod5/src/lib_pod5/py.typed
================================================


================================================
FILE: python/lib_pod5/src/test/test_lib_pod5.py
================================================
"""
Basic lib pod5 tests
"""

from pathlib import Path

from lib_pod5 import Pod5FileReader, create_file, open_file


def test_create_file(tmp_path: Path) -> None:
    """Creating a file through lib-pod5 makes it appear on disk"""
    output_file = tmp_path / "test.pod5"

    # Preconditions: the temporary directory is there, the file is not.
    assert tmp_path.exists()
    assert not output_file.exists()

    create_file(str(output_file), "test")
    assert output_file.exists()


def test_open_file(tmp_path: Path) -> None:
    """Test that a lib-pod5 can create and re-open a pod5 file"""
    target = tmp_path / "test.pod5"

    # Close the writer explicitly so the file is complete before it is read
    # back, rather than relying on the unreferenced writer being collected.
    writer = create_file(str(target), "test")
    writer.close()
    assert target.exists()

    reader = open_file(str(target))
    try:
        assert isinstance(reader, Pod5FileReader)
    finally:
        # Release the file handle even when the assertion fails.
        reader.close()


================================================
FILE: python/pod5/Makefile
================================================
SHELL = /bin/bash
# Interpreter used to create the virtual environment; override on the command
# line with `make PYTHON=...`. lib_pod5, which this package wraps, requires
# Python >= 3.9, so the default must not pin an older minor version.
PYTHON ?= python3

envDir = venv
envPrompt ?= "pod5"

.PHONY: clean install update docs

# Clean the python virtual environment
clean:
	rm -rf ${envDir}

# Completely install the python environment for development
install: clean
	${PYTHON} -m venv --prompt=${envPrompt} ${envDir}
	source ${envDir}/bin/activate \
	&& pip install --upgrade pip \
	&& pip install -e .[dev] \
	&& pre-commit install

	@echo "To activate your new environment:  source ${envDir}/bin/activate"

# Re-install the pod5 environments to refresh / update the environment with changes
update:
	source ${envDir}/bin/activate \
	&& pip install -e .[dev]

	@echo "Updated python environment"


================================================
FILE: python/pod5/README.md
================================================
# POD5 Python Package

The `pod5` Python package contains the tools and python API wrapping the compiled bindings
for the POD5 file format from `lib_pod5`.

## Installation

The `pod5` package is available on [pypi](https://pypi.org/project/pod5/) and is
installed using `pip`:

``` console
  > pip install pod5
```

## Usage

### Reading a POD5 File

To read a `pod5` file provide the `Reader` class with the input `pod5` file path
and call `Reader.reads()` to iterate over read records in the file. The example below
prints the read_id of every record in the input `pod5` file.

``` python
import pod5 as p5

with p5.Reader("example.pod5") as reader:
    for read_record in reader.reads():
        print(read_record.read_id)
```

To iterate over a selection of read_ids supply `Reader.reads()` with a collection
of read_ids which must be `UUID` compatible:

``` python
import pod5 as p5

# Create a collection of read_id UUIDs
read_ids: List[str] = [
  "00445e58-3c58-4050-bacf-3411bb716cc3",
  "00520473-4d3d-486b-86b5-f031c59f6591",
]

with p5.Reader("example.pod5") as reader:
    for read_record in reader.reads(selection=read_ids):
        assert str(read_record.read_id) in read_ids
```

### Plotting Signal Data Example

Here is an example of how a user may plot a read’s signal data against time.

``` python
import matplotlib.pyplot as plt
import numpy as np

import pod5 as p5

# Using the example pod5 file provided
example_pod5 = "test_data/multi_fast5_zip.pod5"
selected_read_id = '0000173c-bf67-44e7-9a9c-1ad0bc728e74'

with p5.Reader(example_pod5) as reader:

    # Read the selected read from the pod5 file
    # next() is required here as Reader.reads() returns a Generator
    read = next(reader.reads(selection=[selected_read_id]))

    # Get the signal data and sample rate
    sample_rate = read.run_info.sample_rate
    signal = read.signal

    # Compute the time steps over the sampling period
    time = np.arange(len(signal)) / sample_rate

    # Plot using matplotlib
    plt.plot(time, signal)
```

### Writing a POD5 File

The `pod5` package provides the functionality to write POD5 files.

It is strongly recommended that users first look at the available tools when
manipulating existing datasets, as there may already be a tool to meet your needs.
New tools may be added to support our users and if you have a suggestion for a
new tool or feature please submit a request on the
[pod5-file-format GitHub issues page](https://github.com/nanoporetech/pod5-file-format/issues).

Below is an example of how one may add reads to a new POD5 file using the `Writer`
and its `add_read()` method.

```python
import pod5 as p5

# Populate container classes for read metadata
pore = p5.Pore(channel=123, well=3, pore_type="pore_type")
calibration = p5.Calibration(offset=0.1, scale=1.1)
end_reason = p5.EndReason(name=p5.EndReasonEnum.SIGNAL_POSITIVE, forced=False)
run_info = p5.RunInfo(
    acquisition_id = ...
    acquisition_start_time = ...
    adc_max = ...
    ...
)
signal = ... # some signal data as numpy np.int16 array

read = p5.Read(
    read_id=UUID("0000173c-bf67-44e7-9a9c-1ad0bc728e74"),
    end_reason=end_reason,
    calibration=calibration,
    pore=pore,
    run_info=run_info,
    ...
    signal=signal,
)

with p5.Writer("example.pod5") as writer:
    # Write the read object
    writer.add_read(read)
```

## Tools

1. [pod5 view](#pod5-view)
2. [pod5 inspect](#pod5-inspect)
3. [pod5 merge](#pod5-merge)
4. [pod5 filter](#pod5-filter)
5. [pod5 subset](#pod5-subset)
6. [pod5 repack](#pod5-repack)
7. [pod5 recover](#pod5-recover)
8. [pod5 convert fast5](#pod5-convert-fast5)
9. [pod5 convert to_fast5](#pod5-convert-to_fast5)
10. [pod5 update](#pod5-update)

The ``pod5`` package provides the following tools for inspecting and manipulating
POD5 files as well as converting between ``.pod5`` and ``.fast5`` file formats.

To disable the [tqdm](https://github.com/tqdm/tqdm) progress bar set the environment
variable ``POD5_PBAR=0``.

To enable debugging output which may also output detailed log files, set the environment
variable ``POD5_DEBUG=1``

### Pod5 View

The ``pod5 view`` tool is used to produce a table similar to a sequencing summary
from the contents of ``.pod5`` files. The default output is a tab-separated table
written to stdout with all available fields.

This tool is intended to replace ``pod5 inspect reads`` and is over 200x faster.

``` bash
> pod5 view --help

# View the list of fields with a short description in-order (shortcut -L)
> pod5 view --list-fields

# Write the summary to stdout
> pod5 view input.pod5

# Write the summary of multiple pod5s to a file
> pod5 view *.pod5 --output summary.tsv

# Write the summary as a csv
> pod5 view *.pod5 --output summary.csv --separator ','

# Write only the read_ids with no header (shorthand -IH)
> pod5 view input.pod5 --ids --no-header

# Write only the listed fields
# Note: The field order is fixed to the order shown in --list-fields
> pod5 view input.pod5 --include "read_id, channel, num_samples, end_reason"

# Exclude some unwanted fields
> pod5 view input.pod5 --exclude "filename, pore_type"
```

### Pod5 inspect

The ``pod5 inspect`` tool can be used to extract details and summaries of
the contents of ``.pod5`` files. There are two programs for users within ``pod5 inspect``
and these are ``read`` and ``reads``.

``` bash
> pod5 inspect --help
> pod5 inspect {reads, read, summary} --help
```

#### Pod5 inspect reads

> :warning: This tool is deprecated and has been replaced by ``pod5 view`` which is significantly faster.

Inspect all reads and print a csv table of the details of all reads in the given ``.pod5`` files.

``` bash
> pod5 inspect reads pod5_file.pod5

  read_id,channel,well,pore_type,read_number,start_sample,end_reason,median_before,calibration_offset,calibration_scale,sample_count,byte_count,signal_compression_ratio
  00445e58-3c58-4050-bacf-3411bb716cc3,908,1,not_set,100776,374223800,signal_positive,205.3,-240.0,0.1,65582,58623,0.447
  00520473-4d3d-486b-86b5-f031c59f6591,220,1,not_set,7936,16135986,signal_positive,192.0,-233.0,0.1,167769,146495,0.437
    ...
```

#### Pod5 inspect read

Inspect the pod5 file, find a specific read and print its details.

``` console
> pod5 inspect read pod5_file.pod5 00445e58-3c58-4050-bacf-3411bb716cc3

  File: out-tmp/output.pod5
  read_id: 0e5d6827-45f6-462c-9f6b-21540eef4426
  read_number:    129227
  start_sample:   367096601
  median_before:  171.889404296875
  channel data:
  channel: 2366
  well: 1
  pore_type: not_set
  end reason:
  name: signal_positive
  forced False
  calibration:
  offset: -243.0
  scale: 0.1462070643901825
  samples:
  sample_count: 81040
  byte_count: 71989
  compression ratio: 0.444
  run info
      acquisition_id: 2ca00715f2e6d8455e5174cd20daa4c38f95fae2
      acquisition_start_time: 2021-07-23 13:48:59.780000
      adc_max: 0
      adc_min: 0
      context_tags
      barcoding_enabled: 0
      basecall_config_filename: dna_r10.3_450bps_hac_prom.cfg
      experiment_duration_set: 2880
      ...
```

### Pod5 merge

``pod5 merge`` is a tool for merging multiple  ``.pod5`` files into one monolithic pod5 file.

The contents of the input files are checked for duplicate read_ids to avoid
accidentally merging identical reads. To override this check set the argument
``-D / --duplicate-ok``

``` bash
# View help
> pod5 merge --help

# Merge a pair of pod5 files
> pod5 merge example_1.pod5 example_2.pod5 --output merged.pod5

# Merge a glob of pod5 files
> pod5 merge *.pod5 -o merged.pod5

# Merge a glob of pod5 files ignoring duplicate read ids
> pod5 merge *.pod5 -o merged.pod5 --duplicate-ok
```

### Pod5 filter

``pod5 filter`` is a simpler alternative to ``pod5 subset`` where reads are subset from
one or more input ``.pod5`` files using a list of read ids provided using the ``--ids`` argument
and writing those reads to a *single* ``--output`` file.

See ``pod5 subset`` for more advanced subsetting.

``` bash
> pod5 filter example.pod5 --output filtered.pod5 --ids read_ids.txt
```

The ``--ids`` selection text file must be a simple list of valid UUID read_ids with
one read_id per line. Only records which match the UUID regex (lower-case) are used.
Lines beginning with a ``#`` (hash / pound symbol) are interpreted as comments.
Empty lines are not valid and may cause errors during parsing.

> The ``filter`` and ``subset`` tools will assert that any requested read_ids are
> present in the inputs. If a requested read_id is missing from the inputs
> then the tool will issue the following error:
>
> ``` bash
> POD5 has encountered an error: 'Missing read_ids from inputs but --missing-ok not set'
> ```
>
> To disable this error, set the ``-M / --missing-ok`` argument.

When supplying multiple input files to 'filter' or 'subset', the tool is
effectively performing a ``merge`` operation. The 'merge' tool is better suited
for handling very large numbers of input files.

#### Example filtering pipeline

This is a trivial example of how to select a random sample of 1000 read_ids from a
pod5 file using ``pod5 view`` and ``pod5 filter``.

``` bash
# Get a random selection of read_ids
> pod5 view all.pod5 --ids --no-header --output all_ids.txt
> sort --random-sort all_ids.txt | head --lines 1000 > 1k_ids.txt

# Filter to that selection
> pod5 filter all.pod5 --ids 1k_ids.txt --output 1k.pod5

# Check the output
> pod5 view 1k.pod5 -IH | wc -l
1000
```

### Pod5 subset

``pod5 subset`` is a tool for subsetting reads in ``.pod5`` files into one or more
output ``.pod5`` files. See also ``pod5 filter``

The ``pod5 subset`` tool requires a *mapping* which defines which read_ids should be
written to which output. There are multiple ways of specifying this mapping which are
defined in either a ``.csv`` file or by using a ``--table`` (csv or tsv)
and instructions on how to interpret it.

``pod5 subset`` aims to be a generic tool to subset from multiple inputs to multiple outputs.
If your use-case is to ``filter`` read_ids from one or more inputs into a single output
then ``pod5 filter`` might be a more appropriate tool as the only input is a list of read_ids.

``` bash
# View help
> pod5 subset --help

# Subset input(s) using a pre-defined mapping
> pod5 subset example_1.pod5 --csv mapping.csv

# Subset input(s) using a dynamic mapping created at runtime
> pod5 subset example_1.pod5 --table table.txt --columns barcode
```

> Care should be taken to ensure that when providing multiple input ``.pod5`` files to ``pod5 subset``
> that there are no read_id UUID clashes. If a duplicate read_id is detected an exception
> will be raised unless the ``--duplicate-ok`` argument is set. If ``--duplicate-ok`` is
> set then both reads will be written to the output, although this is not recommended.

#### Note on positional arguments

> The ``--columns`` argument will greedily consume values and as such, care should be taken
> with the placement of any positional arguments. The following line will result in an error
> as the input pod5 file is consumed by ``--columns`` resulting in no input file being set.

```bash
# Invalid placement of positional argument example.pod5
$ pod5 subset --table table.txt --columns barcode example.pod5
```

#### Creating a Subset Mapping

##### Target Mapping (.csv)

The example below shows a ``.csv`` subset target mapping. Any lines (e.g. header line)
which do not have a read_id which matches the UUID regex (lower-case) in the second
column are ignored.

``` text
target, read_id
output_1.pod5,132b582c-56e8-4d46-9e3d-48a275646d3a
output_1.pod5,12a4d6b1-da6e-4136-8bb3-1470ef27e311
output_2.pod5,0ff4dc01-5fa4-4260-b54e-1d8716c7f225
output_2.pod5,0e359c40-296d-4edc-8f4a-cca135310ab2
output_2.pod5,0e9aa0f8-99ad-40b3-828a-45adbb4fd30c
```

##### Target Mapping from Table

``pod5 subset`` can dynamically generate output targets and collect associated reads
based on a text file containing a table (csv or tsv) parsable by ``polars``.
This table file could be the output from ``pod5 view`` or from a sequencing summary.
The table must contain a header row and a series of columns on which to group unique
collections of values. Internally this process uses the
[polars.DataFrame.group_by](https://pola-rs.github.io/polars/py-polars/html/reference/dataframe/api/polars.DataFrame.group_by.html)
function where the ``by`` parameter is the sequence of column names specified with
the ``--columns`` argument.

Given the following example ``--table`` file, observe the resultant outputs given various
arguments:

``` text
read_id    mux    barcode      length
read_a     1      barcode_a    4321
read_b     1      barcode_b    1000
read_c     2      barcode_b    1200
read_d     2      barcode_c    1234
```

``` bash
> pod5 subset example_1.pod5 --output barcode_subset --table table.txt --columns barcode
> ls barcode_subset
barcode-barcode_a.pod5     # Contains: read_a
barcode-barcode_b.pod5     # Contains: read_b, read_c
barcode-barcode_c.pod5     # Contains: read_d

> pod5 subset example_1.pod5 --output mux_subset --table table.txt --columns mux
> ls mux_subset
mux-1.pod5     # Contains: read_a, read_b
mux-2.pod5     # Contains: read_c, read_d

> pod5 subset example_1.pod5 --output barcode_mux_subset --table table.txt --columns barcode mux
> ls barcode_mux_subset
barcode-barcode_a_mux-1.pod5    # Contains: read_a
barcode-barcode_b_mux-1.pod5    # Contains: read_b
barcode-barcode_b_mux-2.pod5    # Contains: read_c
barcode-barcode_c_mux-2.pod5    # Contains: read_d
```

##### Output Filename Templating

When subsetting using a table the output filename is generated from a template
string. The automatically generated template is the sequential concatenation of
``column_name-column_value`` followed by the ``.pod5`` file extension.

The user can set their own filename template using the ``--template`` argument.
This argument accepts a string in the [Python f-string style](https://docs.python.org/3/tutorial/inputoutput.html#formatted-string-literals)
where the subsetting variables are used for keyword placeholder substitution.
Keywords should be placed within curly-braces. For example:

``` bash
# default template used = "barcode-{barcode}.pod5"
> pod5 subset example_1.pod5 --output barcode_subset --table table.txt --columns barcode

# default template used = "barcode-{barcode}_mux-{mux}.pod5"
> pod5 subset example_1.pod5 --output barcode_mux_subset --table table.txt --columns barcode mux

> pod5 subset example_1.pod5 --output barcode_subset --table table.txt --columns barcode --template "{barcode}.subset.pod5"
> ls barcode_subset
barcode_a.subset.pod5    # Contains: read_a
barcode_b.subset.pod5    # Contains: read_b, read_c
barcode_c.subset.pod5    # Contains: read_d
```

##### Example subsetting from ``pod5 inspect reads``

The ``pod5 inspect reads`` tool will output a csv table summarising the content of the
specified ``.pod5`` file which can be used for subsetting. The example below shows
how to split a ``.pod5`` file by the well field.

``` bash
# Create the csv table from inspect reads
> pod5 inspect reads example.pod5 > table.csv
> pod5 subset example.pod5 --table table.csv --columns well
```

### Pod5 repack

``pod5 repack`` will simply repack ``.pod5`` files into one-for-one output files of the same name.

``` bash
> pod5 repack pod5s/*.pod5 repacked_pods/
```

### Pod5 Recover

``pod5 recover`` will attempt to recover data from corrupted or truncated ``.pod5`` files
by copying all valid table batches and cleanly closing the new files. New files are written
as siblings to the inputs with the `_recovered.pod5` suffix.

``` bash
> pod5 recover --help
> pod5 recover broken.pod5
> ls
broken.pod5 broken_recovered.pod5
```

### pod5 convert fast5

The ``pod5 convert fast5`` tool takes one or more ``.fast5`` files and converts them
to one or more ``.pod5`` files.

If the tool detects single-read fast5 files, please convert them into multi-read
fast5 files using the tools available in the ``ont_fast5_api`` project.

The progress bar shown during conversion assumes the number of reads in an input
``.fast5`` is 4000. The progress bar will update the total value during runtime if
required.

> Some content previously stored in ``.fast5`` files is **not** compatible with the POD5
> format and will not be converted. This includes all analyses stored in the
> ``.fast5`` file.
>
> Please ensure that any other data is recovered from ``.fast5`` before deletion.

By default ``pod5 convert fast5`` will show exceptions raised during conversion as *warnings*
to the user. This is to gracefully handle potentially corrupt input files or other
runtime errors in long-running conversion tasks. The ``--strict`` argument allows
users to opt-in to strict runtime assertions where any exception raised will promptly
stop the conversion process with an error.

``` bash
# View help
> pod5 convert fast5 --help

# Convert fast5 files into a monolithic output file
> pod5 convert fast5 ./input/*.fast5 --output converted.pod5

# Convert fast5 files into a monolithic output in an existing directory
> pod5 convert fast5 ./input/*.fast5 --output outputs/
> ls outputs/
output.pod5 # default name

# Convert each fast5 to its relative converted output. The output files are written
# into the output directory at paths relative to the path given to the
# --one-to-one argument. Note: This path must be a relative parent to all
# input paths.
> ls input/*.fast5
file_1.fast5 file_2.fast5 ... file_N.fast5
> pod5 convert fast5 ./input/*.fast5 --output output_pod5s/ --one-to-one ./input/
> ls output_pod5s/
file_1.pod5 file_2.pod5 ... file_N.pod5

# Note the different --one-to-one path which is now the current working directory.
# The new sub-directory output_pod5s/input is created.
> pod5 convert fast5 ./input/*.fast5 --output output_pod5s/ --one-to-one ./
> ls output_pod5s/
input/file_1.pod5 input/file_2.pod5 ... input/file_N.pod5

# Convert all inputs so that they have neighbouring pod5 in current directory
> pod5 convert fast5 *.fast5 --output . --one-to-one .
> ls
file_1.fast5 file_1.pod5 file_2.fast5 file_2.pod5  ... file_N.fast5 file_N.pod5

# Convert all inputs so that they have neighbouring pod5 files from a parent directory
> pod5 convert fast5 ./input/*.fast5 --output ./input/ --one-to-one ./input/
> ls input/*
file_1.fast5 file_1.pod5 file_2.fast5 file_2.pod5  ... file_N.fast5 file_N.pod5
```

### Pod5 convert to_fast5

The ``pod5 convert to_fast5`` tool takes one or more ``.pod5`` files and converts them
to multiple ``.fast5`` files. The default behaviour is to write 4000 reads per output file
but this can be controlled with the ``--file-read-count`` argument.

``` bash
# View help
> pod5 convert to_fast5 --help

# Convert pod5 files to fast5 files with default 4000 reads per file
> pod5 convert to_fast5 example.pod5 --output pod5_to_fast5/
> ls pod5_to_fast5/
output_1.fast5 output_2.fast5 ... output_N.fast5
```

### Pod5 Update

The ``pod5 update`` tool is used to update old pod5 files to use the latest schema.
Currently the latest schema version is version 3.

Files are written into the ``--output`` directory with the same name.

``` bash
> pod5 update --help

# Update a named file
> pod5 update my.pod5 --output updated/
> ls updated
updated/my.pod5

# Update an entire directory
> pod5 update old/ -o updated/
```


================================================
FILE: python/pod5/examples/find_all_reads.py
================================================
#!/usr/bin/python3

import argparse
from pathlib import Path

import pod5 as p5


def main():
    """
    Print the read id and sample count of every read in a pod5 file.

    The path of the pod5 file is taken from the single positional command
    line argument `input`.
    """
    # The text must be passed as `description`: the first positional parameter
    # of ArgumentParser is `prog`, which would replace the program name in the
    # usage line instead of describing the script.
    parser = argparse.ArgumentParser(
        description="Iterate through all read ids in a pod5 file"
    )
    parser.add_argument("input", type=Path)
    args = parser.parse_args()

    with p5.Reader(args.input) as reader:
        for read in reader.reads():
            print(f"Found read {read.read_id}")
            print(f"  Read has  {read.sample_count} samples")


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/examples/find_specific_reads.py
================================================
#!/usr/bin/python3

import argparse
from pathlib import Path
from uuid import UUID

import pandas as pd

import pod5 as p5


def main():
    """
    Print the read id and sample count of selected reads in a pod5 file.

    Command line arguments are the pod5 file path (`input`) and a csv file
    (`read_ids_csv`) whose `read_id` column lists the reads to find.
    """
    # The text must be passed as `description`: the first positional parameter
    # of ArgumentParser is `prog`, which would replace the program name in the
    # usage line instead of describing the script.
    parser = argparse.ArgumentParser(
        description="Iterate through specific read ids in a pod5 file"
    )
    parser.add_argument("input", type=Path)
    parser.add_argument("read_ids_csv", type=Path)
    args = parser.parse_args()

    # NOTE(review): the selection is passed as UUID objects; confirm that
    # Reader.reads accepts UUIDs as well as read_id strings.
    read_ids_to_find = [UUID(r) for r in pd.read_csv(args.read_ids_csv)["read_id"]]

    with p5.Reader(args.input) as reader:
        for read in reader.reads(read_ids_to_find):
            print(f"Found read {read.read_id}")
            print(f"  Read has  {read.sample_count} samples")


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/pyproject.toml
================================================
[build-system]
requires = ["setuptools >= 61.0", "wheel"]
build-backend = "setuptools.build_meta"


[project]
name = "pod5"
authors = [
  { name = "Oxford Nanopore Technologies plc", email = "support@nanoporetech.com" },
]
readme = "README.md"
requires-python=">= 3.9, < 4.0"
description = "Oxford Nanopore Technologies Pod5 File Format Python API and Tools"
dynamic = ["version"]
keywords = ['nanopore']
classifiers = [
  'Environment :: Console',
  'Intended Audience :: Developers',
  'Intended Audience :: Science/Research',
  'Natural Language :: English',
  'Programming Language :: Python :: 3',
  'Topic :: Scientific/Engineering :: Bio-Informatics',
]
license="MPL-2.0"

dependencies = [
  "deprecated ~= 1.2.18",
  "lib_pod5 == 0.3.39",
  "iso8601",
  "more_itertools",
  "numpy >= 1.21.0",
  'typing-extensions; python_version<"3.10"',
  'pyarrow ~= 22.0.0; python_version>="3.10"',
  'pyarrow ~= 18.0.0; python_version<"3.10"',
  "pytz",
  "packaging",
  "polars ~= 1.30",
  'h5py ~= 3.11',
  "vbz_h5py_plugin",
  "tqdm",
]

[project.optional-dependencies]
dev = [
  "black == 23.3.0",
  "mypy == 1.3.0",
  "pre-commit==v2.21.0",
  "psutil",
  "pytest ~= 7.3",
  "pytest-cov ~= 4.0",
  "pytest-mock",
  "types-Deprecated",
  "types-setuptools",
  "types-pytz",
]

[project.scripts]
pod5 = "pod5.tools.main:main"

[project.urls]
Homepage = "https://github.com/nanoporetech/pod5-file-format"
Issues = "https://github.com/nanoporetech/pod5-file-format/issues"
Documentation = "https://pod5-file-format.readthedocs.io/en/latest/"

[tool.setuptools.packages.find]
where = ["src"]
exclude = ["test*"]

[tool.setuptools.dynamic]
version = { attr = "pod5._version.__version__" }

[tool.black]
target-version = ["py37"]


================================================
FILE: python/pod5/setup.py
================================================
"""
pod5 setup.py
Proprietary and confidential information of Oxford Nanopore Technologies plc
All rights reserved; (c)2022: Oxford Nanopore Technologies plc

This script can either install a development version of pod5 to the current
Python environment, or create a Python wheel.

"""

import setuptools

if __name__ == "__main__":
    setuptools.setup()


================================================
FILE: python/pod5/src/pod5/__init__.py
================================================
"""POD5 Format

Bindings for the POD5 file format
"""

# Pull the version from the installed package metadata
import sys

if sys.version_info >= (3, 8):
    from importlib import metadata
else:
    import importlib_metadata as metadata

__version__ = metadata.version("pod5")

from .api_utils import (
    format_read_id_to_str,
    format_read_ids,
    load_read_id_iterable,
    pack_read_ids,
)
from .pod5_types import (
    Calibration,
    CompressedRead,
    EndReason,
    EndReasonEnum,
    Pore,
    Read,
    RunInfo,
)
from .reader import Reader, ReadRecord, ReadRecordBatch
from .dataset import DatasetReader
from .signal_tools import (
    vbz_compress_signal,
    vbz_decompress_signal,
    vbz_decompress_signal_chunked,
    vbz_decompress_signal_into,
)
from .writer import SignalType, Writer

__all__ = (
    "__version__",
    "format_read_id_to_str",
    "format_read_ids",
    "load_read_id_iterable",
    "pack_read_ids",
    "DatasetReader",
    "Calibration",
    "CompressedRead",
    "EndReason",
    "EndReasonEnum",
    "Pore",
    "Read",
    "RunInfo",
    "Reader",
    "ReadRecord",
    "ReadRecordBatch",
    "SignalType",
    "vbz_compress_signal",
    "vbz_decompress_signal",
    "vbz_decompress_signal_chunked",
    "vbz_decompress_signal_into",
    "Writer",
)


================================================
FILE: python/pod5/src/pod5/api_utils.py
================================================
"""
Utility functions for the pod5 API
"""

import warnings
from typing import Any, Collection, List, Union

import numpy as np
import numpy.typing as npt
import pyarrow as pa
from lib_pod5 import format_read_id_to_str, load_read_id_iterable


class Pod5ApiException(Exception):
    """
    Generic Pod5 API Exception

    A plain `Exception` subclass with no extra state, letting callers catch
    errors raised by the pod5 API separately from other exceptions.
    """


def pack_read_ids(
    read_ids: Collection[str], invalid_ok: bool = False
) -> npt.NDArray[np.uint8]:
    """
    Pack a `Collection` of `read_id` strings into a `numpy.ndarray`
    in preparation for writing to pod5 files.

    Parameters
    ----------
    read_ids : Collection[str]
        Collection of well-formatted read_id strings
    invalid_ok : bool
        When `False` (the default) a `RuntimeError` is raised if the count
        returned by `load_read_id_iterable` differs from `len(read_ids)`.
        Otherwise only that many rows are returned.

    Returns
    -------
    packed_read_ids : numpy.ndarray[uint8]
        Repacked read_ids, 16 bytes per row, ready for writing to pod5 files.

    Raises
    ------
    RuntimeError
        If `invalid_ok` is `False` and not every read_id was packed.
    """
    expected = len(read_ids)
    # One 16 byte row is reserved for every supplied read_id
    packed = np.empty(shape=(expected, 16), dtype=np.uint8)
    loaded = load_read_id_iterable(read_ids, packed)

    if loaded != expected and invalid_ok is False:
        raise RuntimeError("Invalid read id passed")

    # Trim the rows which were never filled
    return packed[:loaded]


def format_read_ids(
    read_ids: Union[npt.NDArray[np.uint8], pa.lib.FixedSizeBinaryArray],
) -> List[str]:
    """
    Convert a packed array of read_ids into a list of read_id strings.

    Parameters
    ----------
    read_ids : numpy.ndarray[uint8], pa.lib.FixedSizeBinaryArray
        Packed read_ids from a numpy.ndarray or read directly from pod5 file

    Returns
    -------
    read_ids : list[str]
        A list of converted read_ids as strings
    """
    # For an arrow array the second buffer is handed to the formatter;
    # any other input is passed through unchanged.
    packed = (
        read_ids.buffers()[1]
        if isinstance(read_ids, pa.lib.FixedSizeBinaryArray)
        else read_ids
    )
    return format_read_id_to_str(packed)


def deprecation_warning(deprecated: str, alternate: str) -> None:
    """
    Issue a `DeprecationWarning` that `deprecated` has been deprecated in
    favour of `alternate`.

    Parameters
    ----------
    deprecated : str
        The module path to the deprecated item
    alternate : str
        The module path to the alternate item
    """
    message = f"{deprecated} is deprecated. Please use {alternate}"
    # stacklevel=2 attributes the warning to the caller of this helper
    warnings.warn(message, DeprecationWarning, stacklevel=2)


def safe_close(obj: Any, attr: str) -> None:
    """
    Call close() on the attribute `attr` of `obj`, ignoring any exception raised.

    Nothing is done when `obj` has no such attribute. This makes it safe to
    call from __del__() where attributes may never have been assigned.
    """
    if hasattr(obj, attr):
        try:
            close = getattr(obj, attr).close
            close()
        except Exception:
            # Best-effort only: failures while closing are deliberately ignored
            pass


================================================
FILE: python/pod5/src/pod5/dataset.py
================================================
from concurrent.futures import Future, ThreadPoolExecutor, as_completed
from functools import lru_cache, partial
import os
from pathlib import Path
from typing import (
    Any,
    Callable,
    Collection,
    Dict,
    Generator,
    Iterable,
    List,
    Optional,
    Set,
    Union,
)
import warnings
from pod5.api_utils import Pod5ApiException

from pod5.pod5_types import PathOrStr
from pod5.reader import ReadRecord, Reader
from pod5.tools.utils import search_path

DEFAULT_CPUS = min(os.cpu_count() or 1, 4)


class DatasetReader:
    def __init__(
        self,
        paths: Union[PathOrStr, Collection[PathOrStr]],
        recursive: bool = False,
        pattern: str = "*.pod5",
        index: bool = False,
        threads: int = DEFAULT_CPUS,
        max_cached_readers: Optional[int] = 2**4,
        warn_duplicate_indexing: bool = True,
    ) -> None:
        """
        Open pod5 files and/or directories of pod5 files as a single dataset.

        Parameters
        ----------
        paths : PathOrStr | Collection[PathOrStr]
            One or more files or directories to load
        recursive : bool
            Search directories in `paths` recursively
        pattern : str
            A glob expression to match against file names
        index : bool
            Promptly index the dataset instead of deferring until required
        threads : int
            The number of threads to use
        max_cached_readers :  Optional[int]
            The maximum size of the `Reader` LRU cache. Set to `None` for an unlimited
            cache size.
        warn_duplicate_indexing : bool
            Issue warnings when duplicate read_ids are detected and
            indexing by read_id is attempted

        Note
        ----
        Random record access is implemented by creating an index of read_id to file
        path. This can consume a large amount of memory. Methods that generate an index
        have this noted in their docstring.

        Warnings
        --------
        If duplicate read_ids are present in the dataset, iterator methods such
        as `reads()` will yield all copies. Indexing methods such as `get_read`
        return one chosen randomly and issue a warning which can be suppressed by
        setting `warn_duplicate_indexing=False`
        """
        # Resolve the inputs into a sorted list of unique file paths
        found = self._collect_dataset(
            paths, recursive=recursive, pattern=pattern, threads=threads
        )
        self._paths: List[Path] = sorted(found)

        self._num_reads: Optional[int] = None
        self._max_cached_readers = max_cached_readers
        self.threads = threads
        self.warn_duplicate_indexing = warn_duplicate_indexing

        # The reader cache lives on the instance so its size can be chosen here
        self._get_reader = self._init_get_reader(self._max_cached_readers)

        # The index stays unset until it is needed, unless requested up-front
        self._index: Optional[Dict[str, Path]] = None
        if index:
            self._index_read_ids()

    def __iter__(self) -> Generator[ReadRecord, None, None]:
        """Iterate over every ``ReadRecord`` in the dataset, as ``reads()`` does"""
        for record in self.reads():
            yield record

    def __len__(self) -> int:
        """
        Returns the number of reads in this dataset

        This is the value of the `num_reads` property.
        """
        return self.num_reads

    @property
    def num_reads(self) -> int:
        """
        The total number of `ReadRecords` in this dataset.

        The count is computed on first access by summing `num_reads` over the
        `Reader` of each file and is cached for later calls.

        Raises
        ------
        Pod5ApiException
            If the read count of a file could not be obtained
        """
        if self._num_reads is None:

            def _count_reads(path: Path) -> int:
                try:
                    reader = self.get_reader(path)
                    return reader.num_reads
                except Exception as exc:
                    raise Pod5ApiException(
                        f"DatasetReader error reading: {[path]}"
                    ) from exc

            per_file = self._run_max_workers(_count_reads, self.paths, self.threads)
            self._num_reads = sum(per_file)

        return self._num_reads

    @property
    def paths(self) -> List[Path]:
        """
        Return the list of pod5 file paths in this dataset

        The returned list is the internal list itself, not a copy.
        """
        return self._paths

    @property
    def read_ids(self) -> Generator[str, None, None]:
        """
        Yield all read_ids in this dataset.

        The read_ids of each file are fetched using up to `self.threads`
        workers and yielded file by file.
        """

        def _file_read_ids(path: Path) -> List[str]:
            reader = self.get_reader(path)
            return reader.read_ids

        per_file = self._run_max_workers(_file_read_ids, self.paths, self.threads)
        for file_ids in per_file:
            for read_id in file_ids:
                yield read_id

    def reads(
        self,
        selection: Optional[Iterable[str]] = None,
        preload: Optional[Set[str]] = None,
    ) -> Generator[ReadRecord, None, None]:
        """
        Iterate over ``ReadRecord``s in the dataset.

        Parameters
        ----------
        selection : iterable[str]
            The read ids to walk in the file. One-shot iterables (such as
            generators) are copied into a list so that the same selection can
            be applied to every file in the dataset.
        preload : set[str]
            Columns to preload - "samples" and "sample_count" are valid values

        Note
        ----
        ``ReadRecord``s are yielded in on-disk record order for each file in ``self.paths``.

        Missing records are not detected and multiple records will be
        yielded if there are duplicates in either of the dataset or selection.

        Yields
        ------
        ReadRecord
        """
        # The selection is handed to the reader of every file. An iterator
        # would be exhausted by the first file, leaving nothing to select from
        # the remaining files, so materialise anything that is not a Collection.
        if selection is not None and not isinstance(selection, Collection):
            selection = list(selection)

        def _get_reads_iter(path: Path) -> Generator[ReadRecord, None, None]:
            return self.get_reader(path).reads(
                selection=selection, missing_ok=True, preload=preload
            )

        for reads in self._run_max_workers(_get_reads_iter, self.paths, self.threads):
            yield from reads

    def get_read(self, read_id: str) -> Optional[ReadRecord]:
        """
        Look up a single `ReadRecord` by `read_id`, returning `None` when it
        is not in this dataset.

        Parameters
        ----------
        read_id : str
            The read_id (UUID) string in this dataset to find

        Note
        ----
        This method will index the dataset

        Warnings
        --------
        Issues a warning if duplicate read_ids are detected in this dataset.
        The returned `ReadRecord` is always valid but the source may be random
        between instances of a `DatasetReader`.

        Returns
        -------
        Optional[ReadRecord]
        """
        source = self.get_path(read_id)
        if source is None:
            return None

        # Take the first matching record, or None if the reader yields nothing
        matches = self.get_reader(source).reads(selection=[read_id])
        return next(matches, None)

    @staticmethod
    def _init_get_reader(maxsize: Optional[int]) -> Callable[[Path], Reader]:
        """
        Create the cached `Reader` factory used by `get_reader`.

        Building the cached function here allows the size of the LRU cache to
        be set during initialization without global variables.
        """

        # Note that a Pod5.Reader consumes at least 4 file handles.
        # If you experience "Too Many Open Files" reduce the `max_cached_readers` and `threads`
        def _get_reader(path: Path) -> Reader:
            return Reader(path)

        cached_factory = lru_cache(maxsize=maxsize)(_get_reader)
        return cached_factory

    def get_reader(self, path: PathOrStr) -> Reader:
        """
        Return the pod5 file `Reader` for `path`, served from the reader cache.

        Parameters
        ----------
        path : PathOrStr
            Path to a pod5 file

        Returns
        -------
        Reader
        """
        # Normalise to `Path` so str and Path inputs share one cache entry
        cache_key = Path(path)
        return self._get_reader(cache_key)

    def get_path(self, read_id: str) -> Optional[Path]:
        """
        Return the pod5 file `Path` which holds `read_id`, or `None` if the
        read_id was not found.

        Parameters
        ----------
        read_id : str
            The read_id (UUID) string in this dataset

        Note
        ----
        This method will index the dataset

        Warnings
        --------
        Issues a warning if duplicate read_ids are detected in this dataset.
        The returned path is always a valid file which contains this read_id but this
        may be random between instances.

        Returns
        -------
        Optional[Path]
        """
        self.index_read_ids()
        index = self._index
        if index is None:
            return None

        # Duplicates anywhere in the dataset trigger the (optional) warning
        if self.has_duplicate():
            self._issue_duplicate_read_warning()

        return index.get(read_id)

    def clear_readers(self) -> None:
        """
        Clears the readers LRU cache

        Cached `Reader` objects are dropped from the cache; they are not
        explicitly closed here.
        """
        # `cache_clear` is provided by `functools.lru_cache` (see
        # `_init_get_reader`) but is not part of the declared `Callable` type,
        # hence the type-checker ignore.
        self._get_reader.cache_clear()  # type: ignore

    def clear_index(self) -> None:
        """
        Clears the read_id to file path index

        The index is rebuilt by the next call to `index_read_ids()`.
        """
        self._index = None

    def has_duplicate(self) -> bool:
        """
        Report whether any `read_id` appears more than once in this dataset.

        The total number of reads is compared with the number of unique
        read_ids held in the index.

        Note
        ----
        This method will index the dataset
        """
        self.index_read_ids()
        index = self._index
        assert index is not None

        total_reads = len(self)
        unique_read_ids = len(index)
        return total_reads != unique_read_ids

    @staticmethod
    def _collect_dataset(
        paths: Union[PathOrStr, Collection[PathOrStr]],
        recursive: bool,
        pattern: str,
        threads: int,
    ) -> Set[Path]:
        """
        Search `paths` for files matching `pattern` and return them as a set.

        A single path is accepted as well as a collection of paths. Each path
        is searched with `search_path` using up to `threads` workers.

        Raises
        ------
        TypeError
            If `paths` is neither a single path nor a `Collection`
        """
        # A lone path is wrapped so the rest of the function sees a collection
        candidates = [paths] if isinstance(paths, (str, Path, os.PathLike)) else paths

        if not isinstance(candidates, Collection):
            raise TypeError(
                f"paths must be a Collection[PathOrStr] but found {type(paths)=}"
            )

        roots = [Path(p) for p in candidates]
        search = partial(search_path, recursive=recursive, patterns=[pattern])
        with ThreadPoolExecutor(max_workers=threads) as executor:
            # Merge the results of every search into one set of unique paths
            return set().union(*executor.map(search, roots))

    def index_read_ids(self) -> None:
        """
        Build the read_id index unless one already exists.
        """
        if self._index is not None:
            return
        self._index_read_ids()

    def _index_read_ids(self) -> None:
        """
        Build the read_id to file path index for every file in this dataset.

        When a read_id is present in more than one file, the file whose
        results are merged last is the one kept in the index.

        Raises
        ------
        Pod5ApiException
            If the read_ids of a file could not be read. `self._index` is not
            assigned in that case.
        """

        def _get_index(path: Path) -> Dict[str, Path]:
            try:
                return {read_id: path for read_id in self.get_reader(path).read_ids}
            except Exception as exc:
                msg = f"DatasetReader error reading: {[path]}"
                raise Pod5ApiException(msg) from exc

        # Build into a local dict and publish it only once complete. Assigning
        # `self._index` up-front would leave a partial index behind if a file
        # fails, which `index_read_ids()` would then treat as already built.
        index: Dict[str, Path] = {}
        for index_item in self._run_max_workers(_get_index, self.paths, self.threads):
            index.update(index_item)
        self._index = index

    def _issue_duplicate_read_warning(self) -> None:
        """Warn about duplicate read_ids unless `warn_duplicate_indexing` is off"""
        if not self.warn_duplicate_indexing:
            return
        warnings.warn("duplicate read_ids found in dataset")

    @staticmethod
    def _run_max_workers(
        fn: Callable[[Any], Any], iterable: Iterable[Any], max_workers: int
    ) -> Generator[Any, None, None]:
        """
        Apply `fn` to every item of `iterable` in a thread pool and yield the results.

        Results are yielded as their futures complete, which is not
        necessarily the order of `iterable`. Items are submitted lazily so
        that no more than `max_workers` futures are outstanding at a time.
        An exception raised by `fn` is re-raised when its result is yielded.

        Parameters
        ----------
        fn : Callable
            Function called with one item from `iterable`
        iterable : Iterable
            The items to process
        max_workers : int
            The thread pool size, which must be greater than zero
        """
        assert max_workers > 0
        futures: Set[Future] = set()
        with ThreadPoolExecutor(max_workers=max_workers) as executor:
            for item in iterable:
                futures.add(executor.submit(fn, item))
                # Once `max_workers` futures are outstanding, wait for one to
                # complete and yield its result before submitting more work.
                if len(futures) >= max_workers:
                    future = next(as_completed(futures))
                    yield future.result()
                    futures.remove(future)

            # The input is exhausted - drain the futures still outstanding
            for future in as_completed(futures):
                yield future.result()

    def __enter__(self) -> "DatasetReader":
        """Enter the context manager, returning this `DatasetReader`"""
        return self

    def __exit__(self, *exc_details) -> None:
        """
        Exit the context manager, clearing the read_id index and the reader cache.

        The exception details are ignored and `None` is returned, so an
        exception raised inside the `with` block is not suppressed.
        """
        self.clear_index()
        self.clear_readers()


================================================
FILE: python/pod5/src/pod5/pod5_types.py
================================================
"""
Container class for a pod5 Read object
"""

import datetime
import enum
import math
import os
from dataclasses import dataclass, field
from typing import Dict, List, Union
from uuid import UUID

import numpy as np
import numpy.typing as npt

from pod5.signal_tools import vbz_decompress_signal_chunked

PathOrStr = Union[os.PathLike, str]


class EndReasonEnum(enum.Enum):
    """
    EndReason Enumeration

    Each member names one reason a read can end. Members are numbered
    consecutively from 0 (UNKNOWN) to 9 (PAUSED).
    """

    UNKNOWN = 0
    MUX_CHANGE = 1
    UNBLOCK_MUX_CHANGE = 2
    DATA_SERVICE_UNBLOCK_MUX_CHANGE = 3
    SIGNAL_POSITIVE = 4
    SIGNAL_NEGATIVE = 5
    API_REQUEST = 6
    DEVICE_DATA_ERROR = 7
    ANALYSIS_CONFIG_CHANGE = 8
    PAUSED = 9


# Default value of the "forced" flag for every end reason.
# The bool encodes whether reads are "forced" to end. A read is forced to end when the
# cause is some stimulus outside of the signal, such as a device error or an unblock
# operation.
_END_REASON_FORCED_DEFAULTS: Dict[EndReasonEnum, bool] = {
    EndReasonEnum.UNKNOWN: False,
    EndReasonEnum.MUX_CHANGE: True,
    EndReasonEnum.UNBLOCK_MUX_CHANGE: True,
    EndReasonEnum.DATA_SERVICE_UNBLOCK_MUX_CHANGE: True,
    EndReasonEnum.SIGNAL_POSITIVE: False,
    EndReasonEnum.SIGNAL_NEGATIVE: False,
    EndReasonEnum.API_REQUEST: True,
    EndReasonEnum.DEVICE_DATA_ERROR: True,
    EndReasonEnum.ANALYSIS_CONFIG_CHANGE: True,
    EndReasonEnum.PAUSED: True,
}


@dataclass(frozen=True)
class EndReason:
    """
    Describes why a Read ended.

    Parameters
    ----------

    reason: EndReasonEnum
        Enumeration value identifying the end reason.
    forced: bool
        Whether the read break was 'forced'.
    """

    #: Enumeration value identifying the end reason
    reason: EndReasonEnum
    #: True for a 'forced' read break (e.g. mux_change, unblock), otherwise False.
    forced: bool

    @property
    def name(self) -> str:
        """Lower-case name of the end reason enumeration member"""
        member_name = self.reason.name
        return member_name.lower()

    @classmethod
    def from_reason_with_default_forced(cls, reason: EndReasonEnum) -> "EndReason":
        """
        Build an EndReason for `reason`, taking the 'forced' flag from the
        table of per-reason defaults.
        """
        default_forced = _END_REASON_FORCED_DEFAULTS[reason]
        return cls(reason=reason, forced=default_forced)


@dataclass()
class Calibration:
    """
    Calibration values for converting signal data to picoamps.

    Parameters
    ----------

    offset: float
        Offset applied when converting raw ADC data into pA readings.
    scale: float
        Scale factor applied when converting raw ADC data into pA readings.
    """

    #: Offset applied when converting raw ADC data into pA readings.
    offset: float
    #: Scale factor applied when converting raw ADC data into pA readings.
    scale: float

    @classmethod
    def from_range(
        cls, offset: float, adc_range: float, digitisation: float
    ) -> "Calibration":
        """
        Build a Calibration from offset, adc_range and digitisation; the scale
        is adc_range divided by digitisation.
        """
        derived_scale = adc_range / digitisation
        return cls(offset=offset, scale=derived_scale)


@dataclass()
class Pore:
    """
    Data for the pore that the Read was acquired on

    Parameters
    ----------

    channel: int
        1-indexed channel.
    well: int
        1-indexed well.
    pore_type: str
        Name of the pore type present in the well.
    """

    #: 1-indexed channel.
    channel: int
    #: 1-indexed well.
    well: int
    #: Name of the pore type present in the well.
    pore_type: str


@dataclass(frozen=True)
class RunInfo:
    """
    Higher-level information about the Reads that correspond to a part of an
    experiment, protocol or acquisition

    The two dictionary fields (`context_tags` and `tracking_id`) take part in
    equality comparison but are left out of the generated hash.

    Parameters
    ----------

    acquisition_id : str
        A unique identifier for the acquisition.
    acquisition_start_time : datetime.datetime
        This is the clock time for sample 0
    adc_max : int
        The maximum ADC value that might be encountered.
    adc_min : int
        The minimum ADC value that might be encountered.
    context_tags : Dict[str, str]
        The context tags for the run. (For compatibility with fast5).
    experiment_name : str
        The user-supplied name for the experiment being run.
    flow_cell_id : str
        Uniquely identifies the flow cell the data was captured on.
    flow_cell_product_code : str
        Identifies the type of flow cell the data was captured on.
    protocol_name : str
        The name of the protocol that was run.
    protocol_run_id : str
        The unique identifier for the protocol run that produced this data.
    protocol_start_time : datetime.datetime
        When the protocol that the acquisition was part of started.
    sample_id : str
        A user-supplied name for the sample being analysed.
    sample_rate : int
        The number of samples acquired each second on each channel.
    sequencing_kit : str
        The type of sequencing kit used to prepare the sample.
    sequencer_position : str
        The sequencer position the data was collected on.
    sequencer_position_type : str
        The type of sequencing hardware the data was collected on.
    software : str
        A description of the software that acquired the data.
    system_name : str
        The name of the system the data was collected on.
    system_type : str
        The type of system the data was collected on.
    tracking_id : Dict[str, str]
        The tracking id for the run. (For compatibility with fast5).

    """

    #: A unique identifier for the acquisition - note that readers should not
    #: depend on this uniquely determining the other fields in the run_info, or being
    #: unique among the dictionary keys.
    acquisition_id: str
    #: This is the clock time for sample 0
    acquisition_start_time: datetime.datetime
    #: The maximum ADC value that might be encountered. This is a hardware constraint.
    adc_max: int
    #: The minimum ADC value that might be encountered. This is a hardware constraint.
    adc_min: int
    #: The context tags for the run. (For compatibility with fast5).
    #: Compared for equality but excluded from the generated hash (hash=False).
    context_tags: Dict[str, str] = field(hash=False, compare=True)
    #: The user-supplied name for the experiment being run.
    experiment_name: str
    #: Uniquely identifies the flow cell the data was captured on.
    #: This is written on the flow cell case.
    flow_cell_id: str
    #: Identifies the type of flow cell the data was captured on.
    flow_cell_product_code: str
    #: The name of the protocol that was run.
    protocol_name: str
    #: The unique identifier for the protocol run that produced this data.
    protocol_run_id: str
    #: When the protocol that the acquisition was part of started.
    protocol_start_time: datetime.datetime
    #: A user-supplied name for the sample being analysed.
    sample_id: str
    #: The number of samples acquired each second on each channel.
    sample_rate: int
    #: The type of sequencing kit used to prepare the sample.
    sequencing_kit: str
    #: The sequencer position the data was collected on. For removable positions,
    #: like MinION Mk1Bs, this is unique (e.g. 'MN12345'), while for integrated
    #: positions it is not (e.g. 'X1' on a GridION).
    sequencer_position: str
    #: The type of sequencing hardware the data was collected on. For example:
    #: 'MinION Mk1B' or 'GridION' or 'PromethION'.
    sequencer_position_type: str
    #: A description of the software that acquired the data. For example:
    #: 'MinKNOW 21.05.12 (Bream 5.1.6, Configurations 16.2.1, Core 5.1.9, Guppy 4.2.3)'.
    software: str
    #: The name of the system the data was collected on. This might be a sequencer
    #: serial (e.g. 'GXB1234') or a host name (e.g. 'Lab PC').
    system_name: str
    #: The type of system the data was collected on. For example, 'GridION Mk1' or
    #: 'PromethION P48'. If the system is not a Nanopore sequencer with built-in
    #: compute, this will be a description of the operating system
    #: (e.g. 'Ubuntu 20.04').
    system_type: str
    #: The tracking id for the run. (For compatibility with fast5).
    #: Compared for equality but excluded from the generated hash (hash=False).
    tracking_id: Dict[str, str] = field(hash=False, compare=True)


@dataclass()
class ShiftScalePair:
    """
    A pair of floating point shift and scale values.

    Both values default to NaN. Equality is NaN-aware and evaluated per field:
    two pairs are equal when their shifts match and their scales match, where
    a NaN is considered to match another NaN.
    """

    #: The shift value; NaN when not set.
    shift: float = field(default=float("nan"))
    #: The scale value; NaN when not set.
    scale: float = field(default=float("nan"))

    @staticmethod
    def _values_match(left: float, right: float) -> bool:
        """Return True if the values are equal or are both NaN."""
        # Plain equality is tried first so that NaN handling only kicks in
        # when the values differ (NaN never compares equal to itself).
        return left == right or (math.isnan(left) and math.isnan(right))

    def __eq__(self, other: object) -> bool:
        """
        Compare with another pair, treating NaN as equal to NaN in each field.

        Previously NaN was only tolerated when all four values were NaN, so
        e.g. ``(nan, 1.0)`` did not compare equal to an identical pair.
        """
        if not isinstance(other, type(self)):
            return False
        return self._values_match(self.shift, other.shift) and self._values_match(
            self.scale, other.scale
        )


@dataclass()
class BaseRead:
    """
    Base class for POD5 Read Data

    Holds the per-read metadata fields; subclasses add the signal storage.

    Parameters
    ----------

    read_id : UUID
        The read_id of this read as UUID.
    pore : Pore
        Pore data.
    calibration : Calibration
        Calibration data.
    read_number : int
        The read number on channel. This is increasing but typically
        not necessarily consecutive.
    start_sample : int
        The number of samples recorded on this channel before the read started.
    median_before : float
        The level of current in the well before this read.
    end_reason : EndReason
        EndReason data.
    run_info : RunInfo
        RunInfo data.
    num_minknow_events: int
        Number of minknow events that the read contains. Defaults to 0.
    tracked_scaling: ShiftScalePair
        Shift and Scale for tracked read scaling values (based on previous reads shift).
        Defaults to a default-constructed ShiftScalePair.
    predicted_scaling: ShiftScalePair
        Shift and Scale for predicted read scaling values (based on this read's raw signal).
        Defaults to a default-constructed ShiftScalePair.
    num_reads_since_mux_change: int
        Number of selected reads since the last mux change on this read's channel.
        Defaults to 0.
    time_since_mux_change: float
        Time in seconds since the last mux change on this read's channel.
        Defaults to 0.0.
    open_pore_level: float
        The tracked open pore level for the read. Defaults to NaN.
    """

    #: The read_id of this read as UUID
    read_id: UUID
    #: Pore metadata
    pore: Pore
    #: Calibration metadata
    calibration: Calibration
    #: The read number on channel. This is increasing but typically
    #: not necessarily consecutive.
    read_number: int
    #: The number of samples recorded on this channel before the read started.
    start_sample: int
    #: The level of current in the well before this read.
    median_before: float
    #: EndReason data.
    end_reason: EndReason
    #: RunInfo data.
    run_info: RunInfo
    #: Number of minknow events that the read contains
    num_minknow_events: int = field(default=0)
    #: Shift and Scale for tracked read scaling values (based on previous reads shift)
    tracked_scaling: ShiftScalePair = field(default_factory=ShiftScalePair)
    #: Shift and Scale for predicted read scaling values (based on this read's raw signal)
    predicted_scaling: ShiftScalePair = field(default_factory=ShiftScalePair)
    #: Number of selected reads since the last mux change on this read's channel
    num_reads_since_mux_change: int = field(default=0)
    #: Time in seconds since the last mux change on this read's channel
    time_since_mux_change: float = field(default=0.0)
    #: The tracked open pore level for the read.
    open_pore_level: float = field(default=float("nan"))


@dataclass()
class Read(BaseRead):
    """
    A POD5 read whose signal is held uncompressed.

    All metadata fields are inherited from `BaseRead`; this class adds the
    `signal` array.

    Parameters
    ----------

    read_id : UUID
        The read_id of this read as UUID.
    pore : Pore
        Pore data.
    calibration : Calibration
        Calibration data.
    read_number : int
        The read number on channel. This is increasing but typically
        not necessarily consecutive.
    start_sample : int
        The number of samples recorded on this channel before the read started.
    median_before : float
        The level of current in the well before this read.
    end_reason : EndReason
        EndReason data.
    run_info : RunInfo
        RunInfo data.
    signal : numpy.array[int16]
        Uncompressed signal data. Defaults to an empty int16 array.
    """

    #: Uncompressed signal data; a new empty int16 array by default.
    signal: npt.NDArray[np.int16] = field(
        default_factory=lambda: np.array([], dtype=np.int16)
    )

    @property
    def sample_count(self) -> int:
        """Total number of samples, i.e. the length of the uncompressed signal."""
        n_samples = len(self.signal)
        return n_samples


@dataclass()
class CompressedRead(BaseRead):
    """
    A POD5 read whose signal is held as compressed chunks.

    All metadata fields are inherited from `BaseRead`; this class adds the
    compressed chunks and their pre-compression lengths.

    Parameters
    ----------

    read_id : UUID
        The read_id of this read as UUID.
    pore : Pore
        Pore data.
    calibration : Calibration
        Calibration data.
    read_number : int
        The read number on channel. This is increasing but typically
        not necessarily consecutive.
    start_sample : int
        The number of samples recorded on this channel before the read started.
    median_before : float
        The level of current in the well before this read.
    end_reason : EndReason
        EndReason data.
    run_info : RunInfo
        RunInfo data.
    signal_chunks : List[numpy.array[uint8]]
        Compressed signal data in chunks. Defaults to an empty list.
    signal_chunk_lengths : List[int]
        Chunk lengths (number of samples) of signal data **before** compression.
        Defaults to an empty list.
    """

    #: Compressed signal data, one array per chunk.
    signal_chunks: List[npt.NDArray[np.uint8]] = field(default_factory=list)

    #: Number of samples in each chunk **before** compression.
    signal_chunk_lengths: List[int] = field(default_factory=list)

    @property
    def sample_count(self) -> int:
        """Total number of samples: the sum of the pre-compression chunk lengths."""
        total_samples = sum(self.signal_chunk_lengths)
        return total_samples

    @property
    def decompressed_signal(self) -> npt.NDArray[np.int16]:
        """
        Decompress the chunked signal data and return it as a contiguous numpy array.

        Returns
        -------
        decompressed_signal : numpy.array[int16]
            Decompressed signal data
        """
        chunks = self.signal_chunks
        lengths = self.signal_chunk_lengths
        return vbz_decompress_signal_chunked(chunks, lengths)


================================================
FILE: python/pod5/src/pod5/reader.py
================================================
"""
Tools for accessing POD5 data from PyArrow files
"""

import mmap
from collections import namedtuple
from dataclasses import fields
from deprecated import deprecated
from io import BufferedReader, IOBase
import os
from pathlib import Path
from typing import (
    Collection,
    Dict,
    Generator,
    Iterable,
    List,
    Optional,
    Set,
    Tuple,
    Union,
)
from uuid import UUID

import lib_pod5 as p5b
import numpy as np
import numpy.typing as npt
import packaging.version
import pyarrow as pa

from pod5.pod5_types import (
    Calibration,
    EndReason,
    EndReasonEnum,
    PathOrStr,
    Pore,
    Read,
    RunInfo,
    ShiftScalePair,
)

from .api_utils import Pod5ApiException, format_read_ids, pack_read_ids, safe_close
from .signal_tools import vbz_decompress_signal, vbz_decompress_signal_into


# Field names, in order, of a V3 read record.
ReadRecordV3Columns = namedtuple(
    "ReadRecordV3Columns",
    (
        "read_id",
        "read_number",
        "start",
        "channel",
        "well",
        "median_before",
        "pore_type",
        "calibration_offset",
        "calibration_scale",
        "end_reason",
        "end_reason_forced",
        "run_info",
        "signal",
        "num_minknow_events",
        # The next six fields are deprecated: will be removed in 0.4.0
        "tracked_scaling_scale",
        "tracked_scaling_shift",
        "predicted_scaling_scale",
        "predicted_scaling_shift",
        "num_reads_since_mux_change",
        "time_since_mux_change",
        "num_samples",
    ),
)

# A V4 read record has every V3 field (including the six deprecated ones, which
# will be removed in 0.4.0), in the same order, followed by "open_pore_level".
ReadRecordV4Columns = namedtuple(
    "ReadRecordV4Columns",
    ReadRecordV3Columns._fields + ("open_pore_level",),
)


# A signal batch's "signal" and "samples" columns.
Signal = namedtuple("Signal", "signal samples")
# Location and size of a single signal row.
SignalRowInfo = namedtuple(
    "SignalRowInfo",
    "batch_index batch_row_index sample_count byte_count",
)


class ReadRecord:
    """
    Represents the data for a single read from a pod5 record.

    A ReadRecord is a lightweight view: it stores the owning reader, the
    read batch and a row index, and each property looks its value up in the
    batch columns on access.
    """

    def __init__(
        self,
        reader: "Reader",
        batch: "ReadRecordBatch",
        row: int,
        batch_signal_cache: Optional[List[npt.NDArray[np.int16]]] = None,
        selected_batch_index: Optional[int] = None,
    ):
        """
        Parameters
        ----------
        reader : Reader
            The reader used to look up run info and signal batches.
        batch : ReadRecordBatch
            The read batch containing this read.
        row : int
            Row index of this read within `batch`.
        batch_signal_cache : Optional[List[numpy.ndarray[int16]]]
            Optional pre-loaded signal arrays; when given, `signal` is served
            from this list instead of being read from the signal table.
        selected_batch_index : Optional[int]
            Index of this read within `batch_signal_cache`. When None, `row`
            is used to index the cache.
        """
        self._reader = reader
        self._batch = batch
        self._row = row
        self._batch_signal_cache = batch_signal_cache
        self._selected_batch_index = selected_batch_index

    @property
    def read_id(self) -> UUID:
        """
        Get the unique read identifier for the read as a `UUID`.
        """
        return UUID(bytes=self._batch.columns.read_id[self._row].as_py())

    @property
    def read_number(self) -> int:
        """
        Get the integer read number of the read.
        """
        return self._batch.columns.read_number[self._row].as_py()  # type: ignore

    @property
    def start_sample(self) -> int:
        """
        Get the absolute sample at which the read started.
        """
        return self._batch.columns.start[self._row].as_py()  # type: ignore

    @property
    def num_samples(self) -> int:
        """
        Get the number of samples in the read's signal data.
        """
        return self._batch.columns.num_samples[self._row].as_py()  # type: ignore

    @property
    def median_before(self) -> float:
        """
        Get the median before level (in pico amps) for the read.
        """
        return self._batch.columns.median_before[self._row].as_py()  # type: ignore

    @property
    def num_minknow_events(self) -> int:
        """
        Find the number of minknow events in the read.
        """
        return self._batch.columns.num_minknow_events[self._row].as_py()  # type: ignore

    @property
    @deprecated(
        version="0.4.0", reason="Scaling fields were unused and will be removed"
    )
    def tracked_scaling(self) -> ShiftScalePair:
        """
        Find the tracked scaling value in the read.
        """
        return ShiftScalePair(
            self._batch.columns.tracked_scaling_shift[self._row].as_py(),
            self._batch.columns.tracked_scaling_scale[self._row].as_py(),
        )

    @property
    @deprecated(
        version="0.4.0", reason="Scaling fields were unused and will be removed"
    )
    def predicted_scaling(self) -> ShiftScalePair:
        """
        Find the predicted scaling value in the read.
        """
        return ShiftScalePair(
            self._batch.columns.predicted_scaling_shift[self._row].as_py(),
            self._batch.columns.predicted_scaling_scale[self._row].as_py(),
        )

    @property
    @deprecated(
        version="0.4.0", reason="Scaling fields were unused and will be removed"
    )
    def num_reads_since_mux_change(self) -> int:
        """
        Number of selected reads since the last mux change on this read's channel.
        """
        return self._batch.columns.num_reads_since_mux_change[self._row].as_py()  # type: ignore

    @property
    @deprecated(
        version="0.4.0", reason="Scaling fields were unused and will be removed"
    )
    def time_since_mux_change(self) -> float:
        """
        Time in seconds since the last mux change on this read's channel.
        """
        return self._batch.columns.time_since_mux_change[self._row].as_py()  # type: ignore

    @property
    def open_pore_level(self) -> float:
        """
        Get the open pore level for the read.

        This is a float value representing the open pore level of the well prior to the read starting.
        """
        return self._batch.columns.open_pore_level[self._row].as_py()

    @property
    def pore(self) -> Pore:
        """
        Get the pore data associated with the read.
        """
        return Pore(
            self._batch.columns.channel[self._row].as_py(),
            self._batch.columns.well[self._row].as_py(),
            self._batch.columns.pore_type[self._row].as_py(),
        )

    @property
    def calibration(self) -> Calibration:
        """
        Get the calibration data associated with the read.
        """
        return Calibration(
            self._batch.columns.calibration_offset[self._row].as_py(),
            self._batch.columns.calibration_scale[self._row].as_py(),
        )

    @property
    def calibration_digitisation(self) -> int:
        """
        Get the digitisation value used by the sequencer.

        Computed from the run info as ``adc_max - adc_min + 1``.
        Intended to assist workflows ported from legacy file formats.
        """
        return self.run_info.adc_max - self.run_info.adc_min + 1

    @property
    def calibration_range(self) -> float:
        """
        Get the calibration range value.

        Computed as the calibration scale multiplied by the digitisation.
        Intended to assist workflows ported from legacy file formats.
        """
        return self.calibration.scale * self.calibration_digitisation

    @property
    def end_reason(self) -> EndReason:
        """
        Get the end reason data associated with the read.
        """
        return EndReason(
            # The stored end reason string is upper-cased to find the enum member.
            reason=EndReasonEnum[
                self._batch.columns.end_reason[self._row].as_py().upper()
            ],
            forced=self._batch.columns.end_reason_forced[self._row].as_py(),
        )

    @property
    def run_info(self) -> RunInfo:
        """
        Get the run info data associated with the read.
        """
        return self._reader._lookup_run_info(self._batch, self._row)

    @property
    def end_reason_index(self) -> int:
        """
        Get the dictionary index of the end reason data associated with the read.
        This property is the same as the EndReason enumeration value.
        """
        return self._batch.columns.end_reason[self._row].index.as_py()  # type: ignore

    @property
    def run_info_index(self) -> int:
        """
        Get the dictionary index of the run info data associated with the read.
        """
        return self._batch.columns.run_info[self._row].index.as_py()  # type: ignore

    @property
    def sample_count(self) -> int:
        """
        Get the number of samples in the read's signal data.

        Alias of `num_samples`.
        """
        return self.num_samples

    @property
    def byte_count(self) -> int:
        """
        Get the number of bytes used to store the read's data.

        This is the sum of `byte_count` over all of the read's signal rows.
        """
        return sum(r.byte_count for r in self.signal_rows)

    @property
    def has_cached_signal(self) -> bool:
        """
        Get if cached signal is available for this read.
        """
        return self._batch_signal_cache is not None

    @property
    def signal(self) -> npt.NDArray[np.int16]:
        """
        Get the full signal for the read.

        When a signal cache was supplied the cached array is returned;
        otherwise every signal row of the read is loaded (and decompressed
        when the reader reports vbz compression) into one contiguous array.

        Returns
        -------
        numpy.ndarray[int16]
            A numpy array of signal data with int16 type.
        """
        if self._batch_signal_cache is not None:
            # The cache is indexed by position in the selection when one
            # exists, otherwise by the read's row in the batch.
            if self._selected_batch_index is not None:
                return self._batch_signal_cache[self._selected_batch_index]
            return self._batch_signal_cache[self._row]

        rows = self._batch.columns.signal[self._row]
        batch_data = [self._find_signal_row_index(r.as_py()) for r in rows]
        sample_counts = [
            batch.samples[batch_row_index].as_py()
            for batch, _, batch_row_index in batch_data
        ]

        # Allocate the whole output once and fill it one signal row at a time.
        output = np.empty(dtype=np.int16, shape=(sum(sample_counts),))
        current_sample_index = 0

        for (batch, _, batch_row_index), current_row_count in zip(
            batch_data, sample_counts
        ):
            signal = batch.signal
            output_slice = output[
                current_sample_index : current_sample_index + current_row_count
            ]
            if self._reader.is_vbz_compressed:
                vbz_decompress_signal_into(
                    memoryview(signal[batch_row_index].as_buffer()), output_slice
                )
            else:
                output_slice[:] = signal[batch_row_index].values
            current_sample_index += current_row_count
        return output

    @property
    def signal_pa(self) -> npt.NDArray[np.float32]:
        """
        Get the full signal for the read, calibrated in pico amps.

        Returns
        -------
        numpy.ndarray[float32]
            A numpy array of signal data in pico amps with float32 type.
        """
        return self.calibrate_signal_array(self.signal)

    def signal_for_chunk(self, index: int) -> npt.NDArray[np.int16]:
        """
        Get the signal for a given chunk of the read.

        Parameters
        ----------
        index : int
            Index of the chunk within this read's list of signal rows.

        Returns
        -------
        numpy.ndarray[int16]
            A numpy array of signal data with int16 type for the specified chunk.
        """
        # signal_rows can be used to find details of the signal chunks.
        chunk_abs_row_index = self._batch.columns.signal[self._row][index]
        return self._get_signal_for_row(chunk_abs_row_index.as_py())

    @property
    def signal_rows(self) -> List[SignalRowInfo]:
        """
        Get all signal rows for the read

        Returns
        -------
        list[SignalRowInfo]
            A list of signal row data (as SignalRowInfo) in the read.
        """

        def map_signal_row(sig_row) -> SignalRowInfo:
            sig_row = sig_row.as_py()

            batch, batch_index, batch_row_index = self._find_signal_row_index(sig_row)
            # A LargeListArray row is measured by its element count; any other
            # signal column type is measured by the length of its buffer.
            if isinstance(batch.signal, pa.lib.LargeListArray):
                batch_length = len(batch.signal[batch_row_index])
            else:
                batch_length = len(batch.signal[batch_row_index].as_buffer())
            return SignalRowInfo(
                batch_index,
                batch_row_index,
                batch.samples[batch_row_index].as_py(),
                batch_length,
            )

        return [map_signal_row(r) for r in self._batch.columns.signal[self._row]]

    def calibrate_signal_array(
        self, signal_array_adc: npt.NDArray[np.int16]
    ) -> npt.NDArray[np.float32]:
        """
        Transform an array of int16 signal data from ADC space to pA.

        The result is ``(signal + offset) * scale`` using this read's
        calibration, with offset and scale converted to float32.

        Returns
        -------
        A numpy array of signal data with float32 type.
        """
        offset = np.float32(self.calibration.offset)
        scale = np.float32(self.calibration.scale)
        return (signal_array_adc + offset) * scale

    def _find_signal_row_index(self, signal_row: int) -> Tuple[Signal, int, int]:
        """
        Map from a signal_row to a Signal, batch index and row index within that batch.

        The batch index is the absolute row divided by the reader's
        `signal_batch_row_count`; the remainder is the row within that batch.

        Returns
        -------
        A Tuple containing the `Signal` and its `batch_index` and `row_index`
        """
        sig_row_count: int = self._reader.signal_batch_row_count
        sig_batch_idx: int = signal_row // sig_row_count
        sig_batch = self._reader._get_signal_batch(sig_batch_idx)
        batch_row_idx: int = signal_row - (sig_batch_idx * sig_row_count)

        return sig_batch, sig_batch_idx, batch_row_idx

    def _get_signal_for_row(self, signal_row: int) -> npt.NDArray[np.int16]:
        """
        Get the signal data for a given absolute signal row index

        Returns
        -------
        A numpy array of signal data with int16 type.
        """
        batch, _, batch_row_index = self._find_signal_row_index(signal_row)

        signal = batch.signal
        if self._reader.is_vbz_compressed:
            # Decompression needs the number of samples stored for this row.
            sample_count = batch.samples[batch_row_index].as_py()
            return vbz_decompress_signal(
                memoryview(signal[batch_row_index].as_buffer()), sample_count
            )
        return np.array(signal[batch_row_index].values, dtype="int16")

    def to_read(self) -> Read:
        """
        Create a mutable `Read` from this `ReadRecord` instance.

        Every field, including the full signal, is read from the record and
        copied into the new object.

        Returns
        -------
        Read
        """
        return Read(
            read_id=self.read_id,
            pore=self.pore,
            calibration=self.calibration,
            median_before=self.median_before,
            end_reason=self.end_reason,
            read_number=self.read_number,
            run_info=self.run_info,
            start_sample=self.start_sample,
            num_minknow_events=self.num_minknow_events,
            tracked_scaling=self.tracked_scaling,
            predicted_scaling=self.predicted_scaling,
            num_reads_since_mux_change=self.num_reads_since_mux_change,
            time_since_mux_change=self.time_since_mux_change,
            open_pore_level=self.open_pore_level,
            signal=self.signal,
        )


class ReadRecordBatch:
    """
    Read data for one batch of reads, wrapping a single arrow RecordBatch.
    """

    def __init__(self, reader: "Reader", batch: pa.RecordBatch):
        """Wrap `batch` together with the `reader` it belongs to."""

        self._reader: "Reader" = reader
        self._batch: pa.RecordBatch = batch

        # Optional state, filled in later through the setters / on first use.
        self._signal_cache: Optional[p5b.Pod5SignalCacheBatch] = None
        self._selected_batch_rows: Optional[Iterable[int]] = None
        self._columns: Optional[ReadRecordV4Columns] = None

    @property
    def columns(self) -> ReadRecordV4Columns:
        """
        The batch's columns as a ReadRecordColumns instance.

        Built on first access and reused afterwards.
        """
        if self._columns is not None:
            return self._columns

        field_names = self._reader._columns_type._fields
        arrow_columns = [self._batch.column(name) for name in field_names]
        self._columns = ReadRecordV4Columns(*arrow_columns)
        return self._columns

    def set_cached_signal(self, signal_cache: p5b.Pod5SignalCacheBatch) -> None:
        """Store the signal cache for this batch"""
        self._signal_cache = signal_cache

    def set_selected_batch_rows(self, selected_batch_rows: Iterable[int]) -> None:
        """Store the rows of this batch that have been selected"""
        self._selected_batch_rows = selected_batch_rows

    def reads(self) -> Generator[ReadRecord, None, None]:
        """
        Iterate the reads in this batch.

        When selected rows have been set only those rows are yielded,
        otherwise every row is. Cached signal samples, if present and
        non-empty, are passed on to each yielded record.

        Yields
        ------
        ReadRecord
            ReadRecord instances in the file.
        """

        cache = self._signal_cache
        cached_samples = cache.samples if cache and cache.samples else None

        selected_rows = self._selected_batch_rows
        if selected_rows is None:
            for row in range(self.num_reads):
                yield ReadRecord(
                    self._reader, self, row, batch_signal_cache=cached_samples
                )
            return

        # The position within the selection doubles as the index into the cache.
        for position, row in enumerate(selected_rows):
            yield ReadRecord(
                self._reader,
                self,
                row,
                batch_signal_cache=cached_samples,
                selected_batch_index=position,
            )

    def get_read(self, row: int) -> ReadRecord:
        """Build the ReadRecord for the given row index (without cached signal)"""
        record = ReadRecord(self._reader, self, row)
        return record

    @property
    def num_reads(self) -> int:
        """The number of rows in the wrapped RecordBatch"""
        row_total = self._batch.num_rows
        return int(row_total)

    @property
    def read_id_column(self) -> pa.FixedSizeBinaryArray:
        """
        The read id column of this batch, restricted to the selected rows
        when a selection has been set.
        """
        if self._selected_batch_rows is None:
            return self.columns.read_id
        return self.columns.read_id.take(self._selected_batch_rows)

    @property
    def read_number_column(self) -> pa.UInt32Array:
        """
        The read number column of this batch, restricted to the selected rows
        when a selection has been set.
        """
        if self._selected_batch_rows is None:
            return self.columns.read_number
        return self.columns.read_number.take(self._selected_batch_rows)

    @property
    def cached_sample_count_column(self) -> npt.NDArray[np.uint64]:
        """
        The sample counts held by the cached signal data.

        Raises
        ------
        RuntimeError
            If no signal cache is available.
        """
        if self._signal_cache:
            return self._signal_cache.sample_count
        raise RuntimeError("No cached signal data available")

    @property
    def cached_samples_column(self) -> List[npt.NDArray[np.int16]]:
        """
        The samples column held by the cached signal data.

        Raises
        ------
        RuntimeError
            If no signal cache is available.
        """
        if self._signal_cache:
            return self._signal_cache.samples
        raise RuntimeError("No cached signal data available")


class ArrowTableHandle:
    """Class for managing arrow file handles and memory view mapping of tables"""

    def __init__(
        self,
        location: p5b.EmbeddedFileData,
        options: Optional[pa.ipc.IpcReadOptions] = None,
    ) -> None:
        """
        Open the pod5 file named by `location.file_path` and use the location
        data to load an arrow table (e.g. signal table)

        The table is memory mapped unless the `POD5_DISABLE_MMAP_OPEN`
        environment variable is set or the mapping fails with an `OSError`, in
        which case the file is read through a regular file handle instead.

        Parameters
        ----------
        location : lib_pod5.pod5_format_pybind.EmbeddedFileData
            Location data for how a pod5 file should be split in memory to read a table.
            This is returned from p5b.Pod5FileReader.get_file_X_location methods
        options: pa.ipc.IpcReadOptions
            Serialization options for reading IPC format.

        Raises
        ------
        Pod5ApiException
            If handle could not be opened
        """

        # The location data is passed from the p5b.Pod5FileReader.get_file_X_location
        # methods
        self._location = location
        self._options = options
        self._path = Path(self._location.file_path)

        # Every resource starts as None so that close() is always safe to call
        self._fh: Union[BufferedReader, None] = None
        self._mmap: Union[mmap.mmap, None] = None
        self._reader: Union[pa.RecordBatchFileReader, None] = None
        self._stream: Union[pa.PythonFile, pa.NativeFile, None] = None

        if "POD5_DISABLE_MMAP_OPEN" in os.environ:
            self._stream = self._open_without_mmap()
        else:
            # Create a memory view of the file and select the region for the table
            try:
                self._stream = self._open_with_mmap()
            except OSError:
                # If we fail fall back to a traditional open.
                self._stream = self._open_without_mmap()

        self._reader = pa.ipc.open_file(self._stream, options=self._options)

    def _open_without_mmap(self) -> pa.PythonFile:
        """
        Open the table through a regular file handle, exposing only the embedded
        table region `[offset, offset + length)` of the pod5 file to pyarrow.
        """

        class File(IOBase):
            """File-like view over the embedded table region of `handle`"""

            def __init__(self, handle, location):
                self._handle = handle
                self._location = location
                self.seek(0, whence=0)

            def seek(self, position, whence=0):
                """
                Seek within the embedded region and return the new position
                relative to the start of the region.
                """
                if whence == 0:
                    position = position + self._location.offset
                elif whence == 2:
                    # io convention: for SEEK_END the offset is added to the end
                    # (it is usually zero or negative). Translate to an absolute
                    # seek as the end of the region is not the end of the file.
                    position = (
                        self._location.offset + self._location.length
                    ) + position
                    whence = 0
                # The new abs location:
                abs_location = self._handle.seek(position, whence)

                return abs_location - self._location.offset

            def read(self, size=-1):
                """Read up to `size` bytes, never reading past the end of the region"""
                region_end = self._location.offset + self._location.length
                remaining = max(region_end - self._handle.tell(), 0)
                if size is None or size < 0 or size > remaining:
                    size = remaining
                return self._handle.read(size)

        if self._fh is None:
            self._fh = self._path.open("rb")

        return pa.PythonFile(File(self._fh, self._location))

    def _open_with_mmap(self) -> pa.BufferReader:
        """
        Memory map the embedded table region of the pod5 file and wrap it in a
        pyarrow BufferReader.

        Raises
        ------
        Pod5ApiException
            If pyarrow rejects the mapped buffer (`pa.ArrowInvalid`)
        """
        loc = self._location
        # Get the page-aligned offset of this table.
        # If the inner file doesn't align to a page, get the offset to the
        # previous page and extend the length accordingly.
        alignment_remainder = loc.offset % mmap.ALLOCATIONGRANULARITY
        aligned_offset = loc.offset - alignment_remainder
        aligned_length = loc.length + alignment_remainder

        # Temporarily open file to reduce open file handles
        with self._path.open("rb") as fh:
            self._mmap = mmap.mmap(
                fh.fileno(),
                offset=aligned_offset,
                length=aligned_length,
                access=mmap.ACCESS_READ,
            )
            # Slice to remove any leading bytes which are not in the table
            # added from page-alignment
            arrow_table_view = memoryview(self._mmap)[alignment_remainder:]

        try:
            return pa.BufferReader(arrow_table_view)
        except pa.ArrowInvalid as exc:
            raise Pod5ApiException(f"Failed to open ArrowTable: {self._path}") from exc

    @property
    def reader(self) -> pa.ipc.RecordBatchFileReader:
        """
        Return the pyarrow file reader object

        Raises
        ------
        RuntimeError
            If the reader is not available (e.g. the handle has been closed)
        """
        if self._reader is not None:
            return self._reader

        raise RuntimeError(f"Could not open pyarrow reader: {p5b.get_error_string()}")

    @property
    def stream(self) -> Union[pa.PythonFile, pa.NativeFile]:
        """
        Return the pyarrow file stream / backend

        Raises
        ------
        RuntimeError
            If the stream is not available (e.g. the handle has been closed)
        """
        if self._stream is not None:
            return self._stream

        raise RuntimeError(f"Could not open pyarrow stream: {p5b.get_error_string()}")

    def close(self) -> None:
        """
        Cleanly close the open file handles and memory views.

        Resources are released in the reverse order of their dependencies:
        reader, then stream, then the memory map and finally the file handle.
        """
        safe_close(self, "_reader")
        self._reader = None

        safe_close(self, "_stream")
        self._stream = None

        safe_close(self, "_mmap")
        self._mmap = None

        safe_close(self, "_fh")
        self._fh = None

    def __enter__(self) -> "ArrowTableHandle":
        return self

    def __exit__(self, *exc_details) -> None:
        self.close()

    def __del__(self):
        self.close()


class Reader:
    """
    The base reader for POD5 data
    """

    def __init__(self, path: PathOrStr):
        """
        Open a pod5 filepath for reading

        Parameters
        ----------
        path : PathOrStr
            Path to the pod5 file to open

        Raises
        ------
        FileNotFoundError
            If `path` is not an existing file
        Pod5ApiException
            If the underlying file reader could not be opened
        """
        self._path = Path(path).absolute()

        self._file_reader: Optional[p5b.Pod5FileReader] = None
        self._read_handle: Optional[ArrowTableHandle] = None
        self._run_info_handle: Optional[ArrowTableHandle] = None
        self._signal_handle: Optional[ArrowTableHandle] = None

        (
            self._file_reader,
            self._read_handle,
            self._run_info_handle,
            self._signal_handle,
        ) = self._open_arrow_table_handles(self._path)

        # File level metadata is stored in the read table's schema
        schema_metadata = self.read_table.schema.metadata
        self._file_identifier = UUID(
            schema_metadata[b"MINKNOW:file_identifier"].decode("utf-8")
        )
        self._writing_software = schema_metadata[b"MINKNOW:software"].decode("utf-8")
        writing_version_str = schema_metadata[b"MINKNOW:pod5_version"].decode("utf-8")
        writing_version = packaging.version.parse(writing_version_str)

        self._columns_type = ReadRecordV4Columns
        self._reads_table_version = 4

        self._file_version = writing_version
        self._file_version_pre_migration = packaging.version.Version(
            self._file_reader.get_file_version_pre_migration()
        )

        # Warning: The cached signal maintains an open file handle. So ensure that
        # this dictionary is cleared before closing.
        self._cached_signal_batches: Dict[int, Signal] = {}
        self._cached_run_infos: Dict[str, RunInfo] = {}

        # Lazily computed by the properties of the same name
        self._is_vbz_compressed: Optional[bool] = None
        self._signal_batch_row_count: Optional[int] = None

    @staticmethod
    def _open_arrow_table_handles(
        path: Path,
    ) -> Tuple[
        p5b.Pod5FileReader, ArrowTableHandle, ArrowTableHandle, ArrowTableHandle
    ]:
        """
        Open handles to the underlying arrow tables within this pod5 file

        Returns
        -------
        The file reader followed by the read, run_info and signal table handles

        Raises
        ------
        FileNotFoundError
            If `path` is not an existing file
        Pod5ApiException
            If the file reader could not be opened
        """
        if not path.is_file():
            raise FileNotFoundError(f"Failed to open pod5 file at: {path}")

        file_reader = p5b.open_file(str(path))
        if not file_reader:
            raise Pod5ApiException(
                f"Failed to open reader for {path} Reason: {p5b.get_error_string()}"
            )

        read_handle = ArrowTableHandle(file_reader.get_file_read_table_location())
        run_info_handle = ArrowTableHandle(
            file_reader.get_file_run_info_table_location()
        )
        signal_handle = ArrowTableHandle(file_reader.get_file_signal_table_location())
        return file_reader, read_handle, run_info_handle, signal_handle

    def __enter__(self) -> "Reader":
        return self

    def __exit__(self, *exc_details) -> None:
        self.close()

    def __iter__(self) -> Generator[ReadRecord, None, None]:
        """Iterate over all reads"""
        yield from self.reads()

    def close(self) -> None:
        """Close files handles"""

        # Explicitly clear this dictionary first: the cached signal batches keep
        # the signal table's backing file data alive, so they must be released
        # before the handles below are closed.
        self._cached_signal_batches = {}

        safe_close(self, "_read_handle")
        self._read_handle = None

        safe_close(self, "_run_info_handle")
        self._run_info_handle = None

        safe_close(self, "_signal_handle")
        self._signal_handle = None

        safe_close(self, "_file_reader")
        self._file_reader = None

    @property
    def path(self) -> Path:
        """Return the path to this pod5 file"""
        return self._path

    @property
    def inner_file_reader(self) -> p5b.Pod5FileReader:
        """Access the inner c_api Pod5FileReader - use with caution"""
        if self._file_reader is None:
            raise RuntimeError("Pod5FileReader has been closed!")
        return self._file_reader

    @property
    def read_table(self) -> pa.ipc.RecordBatchFileReader:
        """Access the pod5 read table"""
        if self._read_handle is None:
            raise RuntimeError("ArrowTableHandle has been closed!")
        return self._read_handle.reader

    @property
    def run_info_table(self) -> pa.ipc.RecordBatchFileReader:
        """Access the pod5 run_info table"""
        if self._run_info_handle is None:
            raise RuntimeError("ArrowTableHandle has been closed!")
        return self._run_info_handle.reader

    @property
    def signal_table(self) -> pa.ipc.RecordBatchFileReader:
        """Access the pod5 signal table - use with caution"""
        if self._signal_handle is None:
            raise RuntimeError("ArrowTableHandle has been closed!")
        return self._signal_handle.reader

    @property
    def file_version(self) -> packaging.version.Version:
        """The version of pod5 that originally generated this file, this is not updated when updating the file."""
        return self._file_version

    @property
    def file_version_pre_migration(self) -> packaging.version.Version:
        """The version of pod5 that is stored with the file on disk."""
        return self._file_version_pre_migration

    @property
    def writing_software(self) -> str:
        """The `MINKNOW:software` value stored in the read table schema metadata"""
        return self._writing_software

    @property
    def file_identifier(self) -> UUID:
        """The `MINKNOW:file_identifier` value stored in the read table schema metadata"""
        return self._file_identifier

    @property
    def reads_table_version(self) -> int:
        """The version of the reads table layout exposed by this reader"""
        return self._reads_table_version

    @property
    def is_vbz_compressed(self) -> bool:
        """Return if this file's signal is compressed"""
        if self._is_vbz_compressed is None:
            # The signal column is stored as large_binary when compressed
            self._is_vbz_compressed = self.signal_table.schema.field(
                "signal"
            ).type.equals(pa.large_binary())
        return self._is_vbz_compressed

    @property
    def signal_batch_row_count(self) -> int:
        """Return signal batch row count (row count of the first signal batch, or 0)"""
        if self._signal_batch_row_count is None:
            if self.signal_table.num_record_batches > 0:
                self._signal_batch_row_count = self.signal_table.get_batch(0).num_rows
            else:
                self._signal_batch_row_count = 0
        return self._signal_batch_row_count

    @property
    def batch_count(self) -> int:
        """
        Find the number of read batches available in the file.
        """
        return self.read_table.num_record_batches

    @property
    def num_reads(self) -> int:
        """
        Find the number of reads in the file.

        Returns 0 when the read table contains no record batches.
        """
        # We write constant size batches except for the last.
        num_batches = self.read_table.num_record_batches
        if num_batches == 0:
            # There is no batch 0 to inspect in an empty read table
            return 0
        return (
            self.read_table.get_batch(0).num_rows * max(num_batches - 1, 0)
            + self.read_table.get_batch(num_batches - 1).num_rows
        )

    @property
    def read_ids_raw(self) -> pa.ChunkedArray:
        """
        Return chunked arrow array of read ids.

        To get read ids as string use `Reader.read_ids`
        """

        return pa.chunked_array([batch.read_id_column for batch in self.read_batches()])

    @property
    def read_ids(self) -> List[str]:
        """
        Return all read_ids as a list of strings.

        An empty list is returned when the file contains no read batches.

        For the most performant implementation consider `Reader.read_ids_raw`
        """

        def arrow_to_numpy(batch):
            # Get the arrow data as a buffer
            id_buffer = batch.read_id_column.buffers()[1]

            # Pack the arrow buffer into a numpy array of the the right shape
            array = np.frombuffer(id_buffer, dtype=np.uint8)
            return array.reshape((batch.num_reads, 16))

        id_arrays = [arrow_to_numpy(batch) for batch in self.read_batches()]
        if not id_arrays:
            # np.concatenate raises on an empty sequence of arrays
            return []
        return format_read_ids(np.concatenate(id_arrays))

    def get_batch(self, index: int) -> ReadRecordBatch:
        """
        Get a read batch in the file.

        Parameters
        ----------
        index : int
            Index of the record batch in the read table

        Returns
        -------
        ReadRecordBatch
            The requested batch as a ReadRecordBatch.
        """
        return ReadRecordBatch(self, self.read_table.get_batch(index))

    def read_batches(
        self,
        selection: Optional[List[str]] = None,
        batch_selection: Optional[Iterable[int]] = None,
        missing_ok: bool = False,
        preload: Optional[Set[str]] = None,
    ) -> Generator[ReadRecordBatch, None, None]:
        """
        Iterate batches in the file, optionally selecting certain rows.

        Parameters
        ----------
        selection : iterable[str]
            The read ids to walk in the file.
        batch_selection : iterable[int]
            The read batches to walk in the file.
        missing_ok : bool
            If False (the default) an error is raised when selection contains
            entries not found in the file. If True missing entries are ignored.
        preload : set[str]
            Columns to preload - "samples" and "sample_count" are valid values

        Returns
        -------
        Generator[ReadRecordBatch, None, None]
            A generator yielding `ReadRecordBatch`s

        Raises
        ------
        ValueError
            If both `selection` and `batch_selection` are given
        """
        if selection is not None:
            if batch_selection is not None:
                raise ValueError("selection and batch_selection are mutually exclusive")
            yield from self._select_read_batches(
                selection, missing_ok=missing_ok, preload=preload
            )
        elif batch_selection is not None:
            yield from self._read_some_batches(batch_selection, preload=preload)
        else:
            yield from self._reads_batches(preload=preload)

    def reads(
        self,
        selection: Optional[Iterable[str]] = None,
        missing_ok: bool = False,
        preload: Optional[Set[str]] = None,
    ) -> Generator[ReadRecord, None, None]:
        """
        Iterate reads in the file, optionally filtering for certain read ids.

        Parameters
        ----------
        selection : iterable[str]
            The read ids to walk in the file.
        missing_ok : bool
            If False (the default) an error is raised when selection contains
            entries not found in the file. If True missing entries are ignored.
        preload : set[str]
            Columns to preload - "samples" and "sample_count" are valid values

        Returns
        -------
        Generator[ReadRecord, None, None]
            A generator yielding `ReadRecord`s
        """
        if selection is None:
            yield from self._reads(preload=preload)
        else:
            # Materialise the selection as it is measured and traversed downstream
            yield from self._select_reads(
                list(selection), missing_ok=missing_ok, preload=preload
            )

    def _reads(
        self, preload: Optional[Set[str]] = None
    ) -> Generator[ReadRecord, None, None]:
        """Generate all reads"""
        for batch in self.read_batches(preload=preload):
            for read in batch.reads():
                yield read

    def _select_reads(
        self,
        selection: List[str],
        missing_ok: bool = False,
        preload: Optional[Set[str]] = None,
    ) -> Generator[ReadRecord, None, None]:
        """Generate selected reads"""
        for batch in self._select_read_batches(selection, missing_ok, preload=preload):
            for read in batch.reads():
                yield read

    def _reads_batches(
        self, preload: Optional[Set[str]] = None
    ) -> Generator[ReadRecordBatch, None, None]:
        """Generate the record batches"""
        signal_cache = None
        if preload:
            signal_cache = self.inner_file_reader.batch_get_signal(
                "samples" in preload,
                "sample_count" in preload,
            )

        for idx in range(self.read_table.num_record_batches):
            batch = self.get_batch(idx)
            if signal_cache:
                batch.set_cached_signal(signal_cache.release_next_batch())
            yield batch

    def _read_some_batches(
        self,
        batch_selection: Iterable[int],
        preload: Optional[Set[str]] = None,
    ) -> Generator[ReadRecordBatch, None, None]:
        """Generate the selected record batches"""
        # The selection is walked twice (once to request the signal preload and
        # once to yield batches), so materialise it to support one-shot iterables.
        batch_indices = list(batch_selection)

        signal_cache = None
        if preload:
            signal_cache = self.inner_file_reader.batch_get_signal_batches(
                "samples" in preload,
                "sample_count" in preload,
                np.array(batch_indices, dtype=np.uint32),
            )

        for i in batch_indices:
            batch = self.get_batch(i)
            if signal_cache:
                batch.set_cached_signal(signal_cache.release_next_batch())
            yield batch

    def _select_read_batches(
        self,
        selection: List[str],
        missing_ok: bool = False,
        preload: Optional[Set[str]] = None,
    ) -> Generator[ReadRecordBatch, None, None]:
        """
        Generate the selected record batches

        Raises
        ------
        RuntimeError
            If `missing_ok` is False and not every read id in `selection` was found
        """
        successful_finds, per_batch_counts, batch_rows = self._plan_traversal(
            selection, missing_ok=missing_ok
        )

        if not missing_ok and successful_finds != len(selection):
            raise RuntimeError(
                f"Failed to find {len(selection) - successful_finds} requested reads in the file"
            )

        signal_cache: Optional[p5b.Pod5AsyncSignalLoader] = None
        if preload:
            signal_cache = self.inner_file_reader.batch_get_signal_selection(
                "samples" in preload,
                "sample_count" in preload,
                per_batch_counts,
                batch_rows,
            )

        # batch_rows is a flat array; per_batch_counts gives the length of the
        # consecutive slice belonging to each batch.
        current_offset = 0
        for batch_idx, batch_count in enumerate(per_batch_counts):
            current_batch_rows = batch_rows[
                current_offset : current_offset + batch_count
            ]
            current_offset += batch_count

            batch = self.get_batch(batch_idx)
            batch.set_selected_batch_rows(current_batch_rows)
            if signal_cache:
                batch.set_cached_signal(signal_cache.release_next_batch())
            yield batch

    def _plan_traversal(
        self,
        read_ids: Union[Collection[str], npt.NDArray[np.uint8]],
        missing_ok: bool = False,
    ) -> Tuple[int, npt.NDArray[np.uint32], npt.NDArray[np.uint32]]:
        """
        Query the file reader indexes to return the number of read_ids which
        were found and the batches and rows which are needed to traverse each
        read in the selection.

        Parameters
        ----------
        read_ids : Collection or numpy.ndarray of read_id strings
            The read ids to find in the file
        missing_ok : bool
            Forwarded to `pack_read_ids` as `invalid_ok` when `read_ids` is not
            already a numpy array

        Returns
        -------
        successful_find_count: int
            The number of reads that were found from the array of read_ids given
        per_batch_counts: numpy.array[uint32]
            The number of rows from the batch row ids to take to form each RecordBatch
        batch_rows: numpy.array[uint32]
            All batch row ids

        """
        if not isinstance(read_ids, np.ndarray):
            read_ids = pack_read_ids(read_ids, invalid_ok=missing_ok)

        assert isinstance(read_ids, np.ndarray)

        # Output buffers which are filled in by the file reader
        batch_rows = np.empty(dtype="u4", shape=read_ids.shape[0])
        per_batch_counts = np.empty(dtype="u4", shape=self.batch_count)

        successful_find_count = self.inner_file_reader.plan_traversal(
            read_ids,
            per_batch_counts,
            batch_rows,
        )

        return successful_find_count, per_batch_counts, batch_rows

    def _get_signal_batch(self, batch_id: int) -> Signal:
        """Get the `Signal` from the signal_reader batch at batch_id"""
        if batch_id in self._cached_signal_batches:
            return self._cached_signal_batches[batch_id]

        batch = self.signal_table.get_batch(batch_id)

        signal_batch = Signal(*[batch.column(name) for name in Signal._fields])

        self._cached_signal_batches[batch_id] = signal_batch
        return signal_batch

    def _lookup_run_info(self, batch: ReadRecordBatch, batch_row_id: int) -> RunInfo:
        """
        Get the `RunInfo` from the batch at `batch_row_id`

        Results are cached by acquisition id. The run info table is scanned
        until the first row with a matching acquisition id is found.

        Raises
        ------
        Exception
            If the acquisition id is not present in the run info table
        """

        acquisition_id = batch.columns.run_info[batch_row_id].as_py()

        if acquisition_id in self._cached_run_infos:
            return self._cached_run_infos[acquisition_id]

        for idx in range(self.run_info_table.num_record_batches):
            run_info_batch = self.run_info_table.get_batch(idx)
            acquisition_id_col = run_info_batch.column("acquisition_id")
            for row in range(run_info_batch.num_rows):
                if acquisition_id_col[row].as_py() != acquisition_id:
                    continue

                values = {}
                for field in fields(RunInfo):
                    col = run_info_batch.column(field.name)
                    values[field.name] = col[row].as_py()

                    # These columns are read as key/value pairs; expose them as dicts
                    if field.name in ("tracking_id", "context_tags"):
                        values[field.name] = {k: v for k, v in values[field.name]}

                # Stop at the first match rather than scanning the remaining batches
                run_info = RunInfo(**values)
                self._cached_run_infos[acquisition_id] = run_info
                return run_info

        raise Exception(
            f"Failed to find run info '{acquisition_id}' in run info table"
        )

    def __del__(self):
        self.close()


================================================
FILE: python/pod5/src/pod5/repack.py
================================================
"""
Tools to assist repacking pod5 data into other pod5 files
"""

from typing import Collection
import lib_pod5 as p5b

import pod5 as p5


class Repacker:
    """Thin python wrapper over the native `p5b.Repacker` used to repack pod5 data"""

    def __init__(self):
        # Running total of reads queued through the add_* methods
        self._reads_requested = 0
        self._repacker = p5b.Repacker()

    @property
    def is_complete(self) -> bool:
        """Whether the native repacker reports all requested operations as complete"""
        native = self._repacker
        return native.is_complete

    @property
    def currently_open_file_reader_count(self) -> int:
        """Number of file readers currently held open by the native repacker"""
        native = self._repacker
        return native.currently_open_file_reader_count

    @property
    def reads_completed(self) -> int:
        """Number of reads the native repacker reports as written to files"""
        native = self._repacker
        return native.reads_completed

    @property
    def reads_requested(self) -> int:
        """Number of reads which have been requested to be written so far"""
        return self._reads_requested

    def add_output(
        self, output_file: p5.Writer, check_duplicate_read_ids: bool = True
    ) -> p5b.Pod5RepackerOutput:
        """
        Register an output file writer with the repacker so that read data can
        be repacked into it.

        The returned object is the `output_ref` expected by
        `add_selected_reads_to_output` and `add_all_reads_to_output`.

        Parameters
        ----------
        output_file: Writer
            The output file writer to use
        check_duplicate_read_ids: bool
            Check the output for duplicate read ids, and raise an error if found.

        Returns
        -------
        repacker_object: p5b.Pod5RepackerOutput
            The reference identifying this output in later calls
        """
        native_writer = output_file._writer
        assert native_writer is not None
        return self._repacker.add_output(native_writer, check_duplicate_read_ids)

    def add_selected_reads_to_output(
        self,
        output_ref: p5b.Pod5RepackerOutput,
        reader: p5.Reader,
        selected_read_ids: Collection[str],
    ):
        """
        Queue the selected read_ids from `reader` to be copied into the output
        identified by `output_ref`.

        Parameters
        ----------
        output_ref : lib_pod5.pod5_format_pybind.Pod5RepackerOutput
            The repacker handle reference returned from `add_output`
        reader : Reader
            The Pod5 file reader to copy reads from
        selected_read_ids: Collection[str]
            A Collection of read_ids as strings

        Raises
        ------
        RuntimeError
            If any of the selected_read_ids were not found in the source file
        """
        found_count, counts_per_batch, rows = reader._plan_traversal(
            selected_read_ids
        )

        expected_count = len(selected_read_ids)
        if found_count != expected_count:
            raise RuntimeError(
                f"Failed to find {len(selected_read_ids) - found_count} "
                "requested reads in the source file"
            )

        self._reads_requested = self._reads_requested + found_count
        self._repacker.add_selected_reads_to_output(
            output_ref, reader.inner_file_reader, counts_per_batch, rows
        )

    def add_all_reads_to_output(
        self, output_ref: p5b.Pod5RepackerOutput, reader: p5.Reader
    ) -> None:
        """
        Queue every read in `reader` to be copied into the output identified by
        `output_ref`.

        Parameters
        ----------
        output_ref : lib_pod5.pod5_format_pybind.Pod5RepackerOutput
            The repacker handle reference returned from `add_output`
        reader : Reader
            The Pod5 file reader to copy reads from
        """
        self._reads_requested = self._reads_requested + reader.num_reads
        native_reader = reader.inner_file_reader
        self._repacker.add_all_reads_to_output(output_ref, native_reader)

    def finish(self) -> None:
        """
        Call finish on the underlying c_api repacker instance to write the footer
        completing the file and freeing resources
        """
        result = self._repacker.finish()
        return result

    def set_output_finished(self, output) -> None:
        """
        Tell the repacker a specific output is complete and can be finalised.
        """
        result = self._repacker.set_output_finished(output)
        return result


================================================
FILE: python/pod5/src/pod5/signal_tools.py
================================================
"""
Tools for handling pod5 signals
"""

from typing import List, Tuple, Union

import lib_pod5 as p5b
import numpy as np
import numpy.typing as npt

DEFAULT_SIGNAL_CHUNK_SIZE = 102400


def vbz_decompress_signal(
    compressed_signal: Union[npt.NDArray[np.uint8], memoryview], sample_count: int
) -> npt.NDArray[np.int16]:
    """
    Decompress one contiguous (not-chunked) buffer of compressed signal data

    Parameters
    ----------
    compressed_signal : numpy.ndarray[uint8]
        The compressed signal bytes to decompress.
    sample_count : int
        The number of samples in the original signal, used to size the output

    Returns
    -------
    A decompressed signal array numpy.ndarray[int16]. An empty input yields an
    empty array regardless of `sample_count`.
    """
    if len(compressed_signal) > 0:
        decompressed = np.empty(sample_count, dtype="i2")
        # The native call fills the pre-allocated output array in place
        p5b.decompress_signal(compressed_signal, decompressed)
        return decompressed

    return np.array([], dtype=np.int16)


def vbz_decompress_signal_chunked(
    compressed_signal_chunks: List[npt.NDArray[np.uint8]], sample_counts: List[int]
) -> npt.NDArray[np.int16]:
    """
    Decompress a list of compressed signal chunks into one contiguous signal

    Parameters
    ----------
    compressed_signal_chunks : List[numpy.ndarray[uint8]]
        The compressed signal data chunks to decompress, in order.
    sample_counts : List[int]
        The number of samples in each original signal chunk

    Returns
    -------
    A decompressed signal array numpy.ndarray[int16] formed by concatenating
    the decompressed chunks

    Raises
    ------
    ValueError
        Inconsistent parameter lengths
    """
    chunk_count = len(compressed_signal_chunks)
    if chunk_count != len(sample_counts):
        raise ValueError(
            f"Inconsistent number of chunks to decompress - "
            f"signals: {len(compressed_signal_chunks)}, counts: {len(sample_counts)}"
        )

    if chunk_count == 0:
        return np.array([], dtype=np.int16)

    # Decompress each chunk with its own sample count, then stitch them together
    pieces = []
    for chunk, count in zip(compressed_signal_chunks, sample_counts):
        pieces.append(vbz_decompress_signal(chunk, count))

    joined: npt.NDArray[np.int16] = np.concatenate(pieces)
    return joined


def vbz_decompress_signal_into(
    compressed_signal: Union[npt.NDArray[np.uint8], memoryview],
    output_array: npt.NDArray[np.int16],
) -> npt.NDArray[np.int16]:
    """
    Decompress compressed signal data into the caller supplied "output_array"

    Parameters
    ----------
    compressed_signal : numpy.ndarray[uint8]
        The compressed signal bytes to decompress.
    output_array : numpy.ndarray[int16]
        The destination location for signal

    Returns
    -------
    `output_array` after it has been filled. Note that for an empty input the
    destination is left untouched and a new empty numpy.ndarray[int16] is
    returned instead.
    """
    if len(compressed_signal) > 0:
        p5b.decompress_signal(compressed_signal, output_array)
        return output_array

    return np.array([], dtype=np.int16)


def vbz_compress_signal(signal: npt.NDArray[np.int16]) -> npt.NDArray[np.uint8]:
    """
    Compress a numpy array of signal data

    Parameters
    ----------
    signal : numpy.ndarray[int16]
        The array of signal data to compress.

    Returns
    -------
    compressed_signal : numpy.array[uint8]
        The compressed signal data as a numpy.ndarray[uint8] (byte array).
        An empty signal yields an empty array.
    """
    if signal.size == 0:
        return np.array([], dtype=np.uint8)

    # Allocate a zeroed buffer of the size reported by the native library
    capacity = p5b.vbz_compressed_signal_max_size(len(signal))
    buffer = np.zeros(capacity, dtype="u1")

    # The native call reports the size which the buffer is then resized to
    written = p5b.compress_signal(signal, buffer)
    trimmed = np.resize(buffer, written)
    return trimmed


def vbz_compress_signal_chunked(
    signal: npt.NDArray[np.int16], signal_chunk_size: int = DEFAULT_SIGNAL_CHUNK_SIZE
) -> Tuple[List[npt.NDArray[np.uint8]], List[int]]:
    """
    Compress a numpy array of signal data into chunks

    Parameters
    ----------
    signal : numpy.ndarray[int16]
        The array of signal data to compress.
    signal_chunk_size : int
        The number of signal samples in a chunk. Must be greater than zero.

    Returns
    -------
    compressed_signal_chunks : List[numpy.array[uint8]]
        A List of chunks of compressed signal data as numpy.ndarray[uint8] (byte arrays)
    signal_chunk_lengths : List[int]
        The number of uncompressed signal samples in each chunk

    Raises
    ------
    ValueError
        If `signal_chunk_size` is not greater than zero
    """
    # A negative step would make the range below empty and silently drop the
    # whole signal, and a zero step raises an unrelated range() error.
    if signal_chunk_size <= 0:
        raise ValueError(
            f"signal_chunk_size must be greater than zero, got: {signal_chunk_size}"
        )

    signal_chunks: List[npt.NDArray[np.uint8]] = []
    signal_chunk_lengths: List[int] = []

    # Take slice views of the signal ndarray (non-copying)
    for slice_index in range(0, len(signal), signal_chunk_size):
        signal_slice = signal[slice_index : slice_index + signal_chunk_size]
        signal_chunks.append(vbz_compress_signal(signal_slice))
        signal_chunk_lengths.append(len(signal_slice))

    return signal_chunks, signal_chunk_lengths


================================================
FILE: python/pod5/src/pod5/tools/__init__.py
================================================
"""POD5 Format Tools"""


================================================
FILE: python/pod5/src/pod5/tools/main.py
================================================
"""Main entry point for pod5 tools"""

import argparse
import sys
from typing import Any

from pod5 import __version__
from pod5.tools.parsers import (
    SubcommandHelpFormatter,
    prepare_pod5_convert,
    prepare_pod5_filter_argparser,
    prepare_pod5_inspect_argparser,
    prepare_pod5_merge_argparser,
    prepare_pod5_recover_argparser,
    prepare_pod5_repack_argparser,
    prepare_pod5_subset_argparser,
    prepare_pod5_update_argparser,
    prepare_pod5_view_argparser,
    run_tool,
)


def main() -> Any:
    """
    Entry point for the ``pod5`` command line interface.

    Builds the root argument parser, registers every sub-command parser on it and
    hands over to ``run_tool`` which parses the command line and runs the selected
    tool. When no sub-command is selected the root help text is printed.
    """
    parser = argparse.ArgumentParser(
        prog="pod5",
        description=(
            "**********      POD5 Tools      **********\n\n"
            "Tools for inspecting, converting, subsetting and formatting POD5 files"
        ),
        epilog="Example: pod5 convert fast5 input.fast5 --output output.pod5",
        formatter_class=SubcommandHelpFormatter,
    )
    parser.add_argument(
        "-v",
        "--version",
        action="version",
        version=f"Pod5 version: {__version__}",
        help="Show pod5 version and exit.",
    )

    def _show_root_help(**_: Any) -> None:
        # Fallback tool: accepts (and ignores) any parsed arguments
        return parser.print_help()

    parser.set_defaults(func=_show_root_help)

    subcommands = parser.add_subparsers(title="sub-commands")

    # Registration order determines the order sub-commands are listed in the help
    registrars = (
        prepare_pod5_convert,
        prepare_pod5_inspect_argparser,
        prepare_pod5_merge_argparser,
        prepare_pod5_repack_argparser,
        prepare_pod5_subset_argparser,
        prepare_pod5_filter_argparser,
        prepare_pod5_recover_argparser,
        prepare_pod5_update_argparser,
        prepare_pod5_view_argparser,
    )
    for register in registrars:
        register(subcommands)

    return run_tool(parser)


# Allow this module to be executed directly as a script; whatever main() returns
# is passed to sys.exit
if __name__ == "__main__":
    sys.exit(main())


================================================
FILE: python/pod5/src/pod5/tools/parsers.py
================================================
"""
Parsers for pod5 tools.

Each parser should have set_defaults(func=tool) called where tool is the core function
of a pod5 tool. These are commonly tool_pod5 (e.g. subset_pod5, merge_pod5)
"""

import argparse
import sys
from pathlib import Path
from typing import Any, Optional

from pod5.signal_tools import DEFAULT_SIGNAL_CHUNK_SIZE
from pod5.tools.utils import DEFAULT_THREADS, is_pod5_debug


class SubcommandHelpFormatter(
    argparse.RawDescriptionHelpFormatter,
    argparse.ArgumentDefaultsHelpFormatter,
):
    """
    Help formatter which keeps raw description text, shows argument defaults and
    prints sub-command listings more compactly by removing the first line of the
    formatted sub-parsers action.
    """

    def _format_action(self, action):
        rendered = super()._format_action(action)
        if action.nargs != argparse.PARSER:
            return rendered

        # Sub-parser actions: keep everything after the first line break only
        _first_line, _newline, remainder = rendered.partition("\n")
        return remainder


def run_tool(parser: argparse.ArgumentParser) -> Any:
    """
    Run the tool prepared by an argparser

    Parses the command line with ``parser``, removes the ``func`` entry from the
    parsed arguments and calls it with the remaining arguments as keyword arguments.

    Returns whatever the tool function returns. If the tool raises an exception it
    is re-raised unchanged when ``is_pod5_debug()`` is true; otherwise a short error
    message is written to stderr and the process exits with status 1.
    """
    kwargs = vars(parser.parse_args())
    tool_func = kwargs.pop("func")
    try:
        return tool_func(**kwargs)
    except Exception as exc:
        if is_pod5_debug():
            # Bare raise keeps the original traceback intact
            raise
        print(f"\nPOD5 has encountered an error: '{exc}'", file=sys.stderr)
        print("\nFor detailed information set POD5_DEBUG=1", file=sys.stderr)
        # sys.exit rather than the builtin exit(), which is only injected by the
        # site module and is not guaranteed to exist in every interpreter
        sys.exit(1)


def add_recursive_argument(parser: argparse.ArgumentParser):
    """Register the shared ``-r`` / ``--recursive`` boolean flag on ``parser``"""
    flags = ("-r", "--recursive")
    parser.add_argument(
        *flags,
        action="store_true",
        default=False,
        help="Search for input files recursively matching `*.pod5`",
    )


def add_force_overwrite_argument(parser: argparse._ActionsContainer):
    """
    Register the shared ``-f`` / ``--force-overwrite`` boolean flag on a parser or
    argument group
    """
    flags = ("-f", "--force-overwrite")
    parser.add_argument(*flags, help="Overwrite destination files", action="store_true")


#
# CONVERT - fast5
#
def pod5_convert_from_fast5_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Build the argument parser for the fast5 to pod5 conversion tool.

    When ``parent`` is given the parser is registered on it as the ``fast5``
    sub-command (alias ``from_fast5``), otherwise a standalone parser is created.
    The parser's ``func`` default calls ``convert_from_fast5`` with the parsed
    arguments.
    """
    description = "Convert fast5 file(s) into a pod5 file(s)"

    if parent is not None:
        parser = parent.add_parser(
            "fast5",
            aliases=["from_fast5"],
            description=description,
            formatter_class=SubcommandHelpFormatter,
        )
    else:
        parser = argparse.ArgumentParser(description=description)

    # Positional inputs
    parser.add_argument(
        "inputs", nargs="+", type=Path, help="Input path for fast5 file"
    )

    # Required options
    required = parser.add_argument_group("required arguments")
    required.add_argument(
        "-o",
        "--output",
        required=True,
        type=Path,
        help="Output path for the pod5 file(s). This can be an existing "
        "directory (creating 'output.pod5' within it) or a new named file path. "
        "A directory must be given when using --one-to-one.",
    )

    # General options
    add_recursive_argument(parser)
    parser.add_argument(
        "-t",
        "--threads",
        type=int,
        default=DEFAULT_THREADS,
        help="Set the number of threads to use",
    )
    parser.add_argument(
        "--strict",
        help="Immediately quit if an exception is encountered during conversion "
        "instead of continuing with remaining inputs after issuing a warning",
        action="store_true",
    )

    # Output control options
    output_control = parser.add_argument_group("output control arguments")
    output_control.add_argument(
        "-O",
        "--one-to-one",
        default=None,
        type=Path,
        help="Output files are written 1:1 to inputs. 1:1 output files are "
        "written to the output directory in a new directory structure relative to the "
        "directory path provided to this argument. This directory path must be a "
        "relative parent of all inputs.",
    )
    add_force_overwrite_argument(output_control)
    output_control.add_argument(
        "--signal-chunk-size",
        type=int,
        default=DEFAULT_SIGNAL_CHUNK_SIZE,
        help="Chunk size to use for signal data set",
    )

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_convert_from_fast5 import convert_from_fast5

        return convert_from_fast5(**kwargs)

    parser.set_defaults(func=run)

    return parser


#
# CONVERT - to_fast5
#
def pod5_convert_to_fast5_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Create an argument parser for the pod5 convert-to-fast5 tool

    When ``parent`` is given the parser is registered on it as the ``to_fast5``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``convert_to_fast5`` with the parsed arguments.
    """
    _desc = "Convert pod5 file(s) into fast5 file(s)"
    if parent is None:
        parser = argparse.ArgumentParser(description=_desc)
    else:
        parser = parent.add_parser(
            name="to_fast5",
            description=_desc,
            formatter_class=SubcommandHelpFormatter,
        )

    parser.add_argument(
        "inputs", type=Path, nargs="+", help="Input path for pod5 file(s)"
    )
    required_group = parser.add_argument_group("required arguments")
    # This tool writes fast5 files and has no --one-to-one option, so the help text
    # must not describe pod5 outputs or refer to that flag.
    required_group.add_argument(
        "-o",
        "--output",
        type=Path,
        required=True,
        help="Output path for the converted fast5 file(s).",
    )
    add_recursive_argument(parser)
    parser.add_argument(
        "-t",
        "--threads",
        default=DEFAULT_THREADS,
        type=int,
        help="How many file writers to keep active",
    )
    output_group = parser.add_argument_group("output control arguments")
    add_force_overwrite_argument(output_group)
    output_group.add_argument(
        "--file-read-count",
        default=4000,
        type=int,
        help="Number of reads to write per file.",
    )

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_convert_to_fast5 import convert_to_fast5

        return convert_to_fast5(**kwargs)

    parser.set_defaults(func=run)

    return parser


#
# CONVERT - root
#
def prepare_pod5_convert(parent: argparse._SubParsersAction) -> argparse.ArgumentParser:
    """
    Create an argument parser for the pod5 convert entry point

    Registers the ``convert`` sub-command on ``parent`` together with its nested
    conversion sub-commands. When ``convert`` is invoked without a conversion type
    the convert help text is printed.
    """

    _desc = "File conversion tools"

    convert_parser = parent.add_parser(
        name="convert",
        description=_desc,
        epilog="Example: pod5 convert fast5 input.fast5 --output output.pod5",
        formatter_class=SubcommandHelpFormatter,
    )
    # run_tool calls func(**kwargs) with the remaining parsed arguments, so the
    # fallback must accept arbitrary keyword arguments (including none at all)
    convert_parser.set_defaults(func=lambda **_: convert_parser.print_help())

    sub_convert_parser = convert_parser.add_subparsers(title="conversion type")

    pod5_convert_from_fast5_argparser(sub_convert_parser)
    pod5_convert_to_fast5_argparser(sub_convert_parser)

    return convert_parser


#
# Filter
#
def prepare_pod5_filter_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Build the argument parser for the pod5 filter tool.

    When ``parent`` is given the parser is registered on it as the ``filter``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``filter_pod5`` with the parsed arguments.
    """
    description = (
        "Take a subset of reads using a list of read_ids from one or more inputs"
    )

    if parent is not None:
        parser = parent.add_parser(
            "filter",
            description=description,
            epilog="Example: pod5 filter inputs*.pod5 --ids read_ids.txt --output filtered.pod5",
        )
    else:
        parser = argparse.ArgumentParser(description=description)

    # Inputs and shared flags
    parser.add_argument(
        "inputs", nargs="+", type=Path, help="Pod5 filepaths to use as inputs"
    )
    add_recursive_argument(parser)
    add_force_overwrite_argument(parser)

    # Mandatory options
    required = parser.add_argument_group("required arguments")
    required.add_argument(
        "-i",
        "--ids",
        required=True,
        type=Path,
        help="A file containing a list of only valid read ids to filter from inputs",
    )
    required.add_argument(
        "-o",
        "--output",
        required=True,
        type=Path,
        help="Destination output filename",
    )

    parser.add_argument(
        "-t",
        "--threads",
        default=DEFAULT_THREADS,
        type=int,
        help="Number of workers",
    )

    content = parser.add_argument_group("content settings")
    content.add_argument(
        "-M",
        "--missing-ok",
        help="Allow missing read_ids",
        action="store_true",
    )

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_filter import filter_pod5

        return filter_pod5(**kwargs)

    parser.set_defaults(func=run)

    return parser


#
# Inspect
#
def prepare_pod5_inspect_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Build the argument parser for the pod5 inspect tool.

    The parser has four nested commands (``summary``, ``reads``, ``read`` and
    ``debug``); the selected one is stored in the ``command`` argument and every
    command dispatches to ``inspect_pod5`` with the parsed arguments.
    """
    description = "Inspect the contents of a pod5 file"

    if parent is not None:
        parser = parent.add_parser(
            "inspect",
            description=description,
            epilog="Example: pod5 inspect reads input.pod5",
        )
    else:
        parser = argparse.ArgumentParser(description=description)

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_inspect import inspect_pod5

        return inspect_pod5(**kwargs)

    commands = parser.add_subparsers(title="command", dest="command")

    # summary: one or more files
    summary = commands.add_parser(
        "summary",
        description="Print a summary of the contents of pod5 files",
        epilog="Example: pod5 inspect summary input.pod5",
    )
    summary.add_argument("input_files", nargs="+", type=Path)
    summary.set_defaults(func=run)

    # reads: one or more files, optionally searched recursively
    reads = commands.add_parser(
        "reads",
        description="Print read information on all reads as a csv table",
        epilog="Example: pod5 inspect reads input.pod5",
    )
    reads.add_argument("input_files", nargs="+", type=Path)
    add_recursive_argument(reads)
    reads.set_defaults(func=run)

    # read: exactly one file and a read id; recursive is fixed to False
    single_read = commands.add_parser(
        "read",
        description="Print detailed read information for a named read id",
        epilog="Example: pod5 inspect read input.pod5 0000173c-bf67-44e7-9a9c-1ad0bc728e74",
    )
    single_read.add_argument("input_files", nargs=1, type=Path)
    single_read.add_argument("read_id", type=str)
    single_read.set_defaults(func=run, recursive=False)

    # debug: exactly one file
    debug = commands.add_parser(
        "debug",
        description="Print debugging information",
        epilog="Example: pod5 inspect debug input.pod5",
    )
    debug.add_argument("input_files", nargs=1, type=Path)
    debug.set_defaults(func=run)

    return parser


#
# MERGE
#
def prepare_pod5_merge_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Create an argument parser for the pod5 merge tool

    When ``parent`` is given the parser is registered on it as the ``merge``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``merge_pod5`` with the parsed arguments.
    """

    _desc = "Merge multiple pod5 files"

    if parent is None:
        parser = argparse.ArgumentParser(description=_desc)
    else:
        parser = parent.add_parser(
            name="merge",
            description=_desc,
            formatter_class=SubcommandHelpFormatter,
            # -o/--output is required, so the example must pass it explicitly
            epilog="Example: pod5 merge inputs/*.pod5 --output merged.pod5",
        )

    # Core arguments
    parser.add_argument(
        "inputs",
        type=Path,
        nargs="+",
        help="Pod5 filepaths to use as inputs",
    )
    parser.add_argument(
        "-o",
        "--output",
        required=True,
        type=Path,
        help="Output filepath",
    )
    add_recursive_argument(parser)
    add_force_overwrite_argument(parser)
    parser.add_argument(
        "-t",
        "--threads",
        type=int,
        default=DEFAULT_THREADS,
        help="Number of workers",
    )
    parser.add_argument(
        "-R",
        "--readers",
        type=int,
        default=20,
        help="number of merge readers TESTING ONLY",
    )

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_merge import merge_pod5

        return merge_pod5(**kwargs)

    parser.set_defaults(func=run)
    return parser


#
# Repack
#
def prepare_pod5_repack_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Create an argument parser for the pod5 repack tool

    When ``parent`` is given the parser is registered on it as the ``repack``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``repack_pod5`` with the parsed arguments.
    """

    _desc = "Repack a pod5 files into a single output"
    if parent is None:
        parser = argparse.ArgumentParser(description=_desc)
    else:
        parser = parent.add_parser(
            name="repack",
            description=_desc,
            # The output directory is an option, not a positional: without
            # --output the example would treat "repacked/" as another input
            epilog="Example: pod5 repack inputs/*.pod5 --output repacked/",
        )

    parser.add_argument(
        "inputs", type=Path, nargs="+", help="Input pod5 file(s) to repack"
    )
    parser.add_argument(
        "-o", "--output", type=Path, help="Output directory for pod5 files"
    )
    add_recursive_argument(parser)
    add_force_overwrite_argument(parser)
    parser.add_argument(
        "-t",
        "--threads",
        type=int,
        default=DEFAULT_THREADS,
        help="Number of repacking workers",
    )

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_repack import repack_pod5

        return repack_pod5(**kwargs)

    parser.set_defaults(func=run)
    return parser


#
# Subset
#
def prepare_pod5_subset_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Build the argument parser for the pod5 subset tool.

    When ``parent`` is given the parser is registered on it as the ``subset``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``subset_pod5`` with the parsed arguments.
    """
    description = (
        "Given one or more pod5 input files, take subsets of reads "
        "into one or more pod5 output files by a user-supplied mapping."
    )

    if parent is not None:
        parser = parent.add_parser(
            "subset",
            description=description,
            formatter_class=SubcommandHelpFormatter,
            epilog="Example: pod5 subset inputs.pod5 --output subset_mux/ "
            "--summary summary.tsv --columns mux",
        )
    else:
        parser = argparse.ArgumentParser(description=description)

    # --- core arguments ---
    parser.add_argument(
        "inputs", nargs="+", type=Path, help="Pod5 filepaths to use as inputs"
    )
    parser.add_argument(
        "-o",
        "--output",
        default=Path.cwd(),
        type=Path,
        help="Destination directory to write outputs",
    )
    add_recursive_argument(parser)
    add_force_overwrite_argument(parser)
    parser.add_argument(
        "-t",
        "--threads",
        default=DEFAULT_THREADS,
        type=int,
        help="Number of subsetting workers",
    )

    # --- direct mapping ---
    direct = parser.add_argument_group("direct mapping")
    direct_exclusive = direct.add_mutually_exclusive_group(required=False)
    direct_exclusive.add_argument(
        "--csv",
        type=Path,
        help="CSV file mapping output filename to read ids",
    )

    # --- table mapping ---
    table = parser.add_argument_group("table mapping")

    # --summary and --table are interchangeable; both are stored as "table"
    table.add_argument(
        "-s",
        "--summary",
        "--table",
        dest="table",
        type=Path,
        help="Table filepath (csv or tsv)",
    )
    table.add_argument(
        "-R",
        "--read-id-column",
        default="read_id",
        type=str,
        help="Name of the read_id column in the summary",
    )
    table.add_argument(
        "-c",
        "--columns",
        nargs="+",
        type=str,
        help="Names of --summary / --table columns to subset on",
    )
    table.add_argument(
        "--template",
        default=None,
        type=str,
        help="template string to generate output filenames "
        '(e.g. "mux-{mux}_barcode-{barcode}.pod5"). '
        "default is to concatenate all columns to values as shown in the example.",
    )
    table.add_argument(
        "-T",
        "--ignore-incomplete-template",
        default=None,
        action="store_true",
        help="Suppress the exception raised if the --template string does not contain "
        "every --columns key",
    )

    # --- content settings ---
    content = parser.add_argument_group("content settings")
    content.add_argument(
        "-M",
        "--missing-ok",
        help="Allow missing read_ids",
        action="store_true",
    )

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_subset import subset_pod5

        return subset_pod5(**kwargs)

    parser.set_defaults(func=run)

    return parser


#
# Recover
#
def prepare_pod5_recover_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Create an argument parser for the pod5 recover tool

    When ``parent`` is given the parser is registered on it as the ``recover``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``recover_pod5`` with the parsed arguments.
    """

    _desc = (
        "Attempt to recover pod5 files. Recovered files are written "
        "to sibling files with the '_recovered.pod5' suffix"
    )
    if parent is None:
        parser = argparse.ArgumentParser(description=_desc)
    else:
        parser = parent.add_parser(name="recover", description=_desc)

    parser.add_argument(
        "--cleanup",
        action="store_true",
        help="Delete successfully recovered input files and files with no data to recover.",
    )

    parser.add_argument(
        "inputs", type=Path, nargs="+", help="Input pod5 file(s) to recover"
    )

    add_recursive_argument(parser)
    add_force_overwrite_argument(parser)

    def run(**kwargs) -> Any:
        # Imported only when the tool is actually run
        from pod5.tools.pod5_recover import recover_pod5

        return recover_pod5(**kwargs)

    parser.set_defaults(func=run)

    return parser


#
# Update
#
def prepare_pod5_update_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Build the argument parser for the pod5 update tool.

    When ``parent`` is given the parser is registered on it as the ``update``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``update_pod5`` with the parsed arguments.
    """
    description = "Update a pod5 files to the latest available version"

    if parent is not None:
        parser = parent.add_parser(
            "update",
            description=description,
            formatter_class=SubcommandHelpFormatter,
        )
    else:
        parser = argparse.ArgumentParser(description=description)

    parser.add_argument(
        "inputs", nargs="+", type=Path, help="Input pod5 file(s) to update"
    )
    parser.add_argument(
        "-o",
        "--output",
        required=True,
        type=Path,
        help="Output directory for updated pod5 files",
    )

    # Shared flags
    add_recursive_argument(parser)
    add_force_overwrite_argument(parser)

    def run(**kwargs) -> Any:
        # Imported only when the tool is actually run
        from pod5.tools.pod5_update import update_pod5

        return update_pod5(**kwargs)

    parser.set_defaults(func=run)

    return parser


#
# View
#
def prepare_pod5_view_argparser(
    parent: Optional[argparse._SubParsersAction] = None,
) -> argparse.ArgumentParser:
    """
    Create an argument parser for the pod5 view tool

    When ``parent`` is given the parser is registered on it as the ``view``
    sub-command, otherwise a standalone parser is created. The parser's ``func``
    default calls ``view_pod5`` with the parsed arguments.
    """

    # No trailing quote character here: this text is shown verbatim in the help
    _desc = """
    Write contents of some pod5 file(s) as a table to stdout or --output if given.
    The default separator is <tab>.
    The column order is always as shown in -L/--list-fields
    """

    if parent is None:
        parser = argparse.ArgumentParser(description=_desc)
    else:
        parser = parent.add_parser(
            name="view",
            description=_desc,
            epilog="Example: pod5 view input.pod5",
            formatter_class=SubcommandHelpFormatter,
        )

    # Inputs are optional (nargs="*") so that e.g. --list-fields works without files
    parser.add_argument(
        "inputs", type=Path, nargs="*", help="Input pod5 file(s) to view"
    )

    parser.add_argument(
        "-o", "--output", type=Path, default=None, help="Output filename"
    )
    add_recursive_argument(parser)
    add_force_overwrite_argument(parser)
    parser.add_argument(
        "-t",
        "--threads",
        default=DEFAULT_THREADS,
        type=int,
        help="Set the number of reader workers",
    )
    format_group = parser.add_argument_group("Formatting")
    format_group.add_argument(
        "-H", "--no-header", action="store_true", help="Omit the header line"
    )
    format_group.add_argument(
        "--separator",
        default="\t",
        help="Table separator character (e.g. ',')",
        type=str,
    )

    selection = parser.add_argument_group("Selection")
    # Stored as "group_read_id" rather than "ids"
    selection.add_argument(
        "-I",
        "--ids",
        action="store_true",
        help="Only write 'read_id' field",
        dest="group_read_id",
    )
    selection.add_argument(
        "-i",
        "--include",
        type=str,
        help="Include a double-quoted comma-separated list of fields",
    )
    selection.add_argument(
        "-x",
        "--exclude",
        type=str,
        help="Exclude a double-quoted comma-separated list of fields.",
    )

    help_group = parser.add_argument_group("List Fields")
    help_group.add_argument(
        "-L",
        "--list-fields",
        action="store_true",
        help="List all groups and fields available for selection and exit",
    )

    def run(**kwargs):
        # Imported only when the tool is actually run
        from pod5.tools.pod5_view import view_pod5

        return view_pod5(**kwargs)

    parser.set_defaults(func=run)

    return parser


================================================
FILE: python/pod5/src/pod5/tools/pod5_convert_from_fast5.py
================================================
"""
Tool for converting fast5 files to the pod5 format
"""

import datetime
import multiprocessing as mp
from multiprocessing.context import SpawnContext
import sys
import warnings
from pod5.pod5_types import CompressedRead
from tqdm.auto import tqdm
import uuid
from pathlib import Path
from queue import Empty
from typing import (
    Any,
    Collection,
    Dict,
    Iterable,
    List,
    Optional,
    Sequence,
    Tuple,
    Union,
)

import h5py
import iso8601
import more_itertools
import vbz_h5py_plugin  # noqa: F401

import pod5 as p5
from pod5.signal_tools import DEFAULT_SIGNAL_CHUNK_SIZE, vbz_compress_signal_chunked
from pod5.tools.parsers import pod5_convert_from_fast5_argparser, run_tool
from pod5.tools.utils import (
    DEFAULT_THREADS,
    PBAR_DEFAULTS,
    collect_inputs,
    init_logging,
    limit_threads,
    logged,
    logged_all,
    terminate_processes,
)

# NOTE(review): not used in the visible part of this module - presumably the number
# of reads grouped together per unit of conversion work; confirm against its users
READ_CHUNK_SIZE = 400
# NOTE(review): presumably the default queue timeout in seconds (QueueManager takes
# a `timeout` argument); confirm against the callers
TIMEOUT_SECONDS = 600


# Module-level logger obtained from pod5.tools.utils.init_logging
logger = init_logging()


class QueueManager:
    """
    Owner of the multiprocessing queues used during conversion: input paths,
    data requests, converted data and exceptions.

    All blocking queue operations use the ``timeout`` given at construction.
    """

    def __init__(
        self,
        context: SpawnContext,
        inputs: Collection[Path],
        threads: int,
        timeout: float,
    ) -> None:
        """
        Manager for balancing work queues

        Creates the four queues from ``context``, then enqueues every input that is
        a file and ``threads * 2`` initial data requests.
        """
        self._requests_size = threads * 2
        self._inputs: mp.Queue = context.Queue(maxsize=len(inputs))
        self._requests: mp.Queue = context.Queue(maxsize=self._requests_size)
        self._data: mp.Queue = context.Queue()
        self._exceptions: mp.Queue = context.Queue()
        self._timeout = timeout

        self._start(inputs=inputs)

    def _await(self, queue: mp.Queue) -> Any:
        """Await the next item on a queue raising TimeoutError if failing"""
        try:
            item = queue.get(timeout=self._timeout)
            return item
        except Empty:
            logger.fatal("Empty queue or timeout ")
            raise TimeoutError(f"No progress in {self._timeout} seconds - quitting")

    def enqueue_request(self) -> None:
        """Enqueue a single request for data"""
        self._requests.put(None, timeout=self._timeout)

    def await_request(self) -> None:
        """Await a request for data"""
        self._await(self._requests)

    @logged()
    def enqueue_data(
        self, path: Optional[Path], reads: Union[List[CompressedRead], int, None]
    ) -> None:
        """
        Enqueues an input path and either a list of compressed reads to be written, or
        the total count of reads converted for that path.
        Otherwise, if path is None, mark the child process as being empty.
        """
        self._data.put((path, reads), timeout=self._timeout)

    @logged(log_time=True)
    def await_data(
        self,
    ) -> Tuple[Optional[Path], Union[List[CompressedRead], int, None]]:
        """
        Await compressed reads or the total count of reads compressed (file end) for
        a input filepath. Enqueues the next request if necessary
        """
        path, item = self._await(self._data)

        # Check for the exhausted process sentinel value
        if path is None:
            return None, None

        # Add another request if we received compressed reads
        if isinstance(item, list):
            self.enqueue_request()

        return path, item

    @logged(log_args=True)
    def enqueue_exception(self, path: Path, exception: Exception, trace: str) -> None:
        """Enqueue an exception (and its formatted trace) raised while handling path"""
        self._exceptions.put((path, exception, trace), timeout=self._timeout)

    def get_exception(self) -> Optional[Tuple[Path, Exception, str]]:
        """Promptly get an exception if any"""
        try:
            # Use short timeout instead of get_nowait as we might call this method
            # very shortly after enqueueing an exception
            path, exc, trace = self._exceptions.get(timeout=0.01)
        except Empty:
            return None

        # logger.error rather than logger.exception: no exception is being handled
        # here, so logger.exception would append a meaningless "NoneType: None"
        logger.error(f"Encountered an exception in {path} - {exc}")
        if trace:
            logger.error(f"Trace Exception {path}\n{trace}")
        return path, exc, trace

    @logged(log_args=True)
    def enqueue_input(self, path: Path) -> None:
        """Enqueue an input path"""
        self._inputs.put(path)

    @logged_all
    def get_input(self) -> Optional[Path]:
        """Promptly get an input if any returning None if queue is empty"""
        try:
            return self._inputs.get(timeout=0.1)
        except Empty:
            pass
        return None

    @logged(log_return=True)
    def _discard_and_close(self, queue: mp.Queue) -> int:
        """
        Discard all remaining enqueued items and close a queue to nicely shutdown the
        queue. Returns the number of discarded items
        """
        count = 0
        while True:
            try:
                queue.get(timeout=0.1)
                count += 1
            except Exception:
                # Best-effort drain: any failure (including Empty) ends the drain
                break
        queue.close()
        queue.join_thread()
        return count

    @logged(log_return=True)
    def shutdown(self) -> Tuple[int, int, int, int]:
        """Shutdown all queues returning the counts of all remaining items"""
        n_inputs = self._discard_and_close(self._inputs)
        n_req = self._discard_and_close(self._requests)
        n_data = self._discard_and_close(self._data)
        n_exc = self._discard_and_close(self._exceptions)

        # Leftover requests are expected; anything else left behind is suspicious
        if n_inputs > 0:
            logger.warning("Unfinished inputs found during shutdown!")
        if n_data > 0:
            logger.warning("Unfinished data found during shutdown!")
        if n_exc > 0:
            logger.warning("Unfinished exceptions found during shutdown!")

        return n_inputs, n_req, n_data, n_exc

    @logged(log_args=True)
    def _start(self, inputs: Iterable[Path]) -> None:
        """Enqueue all inputs for child processes to poll and set the requests size"""
        for path in inputs:
            if path.is_file():
                self.enqueue_input(path)

        for _ in range(self._requests_size):
            self.enqueue_request()


class OutputHandler:
    """
    Class for managing p5.Writer handles

    Maps each input path to its resolved output path and keeps track of which
    output writers are open and which have been closed.
    """

    @logged(log_args=True)
    def __init__(
        self,
        output_root: Path,
        one_to_one: Optional[Path],
        force_overwrite: bool,
    ):
        self.output_root = output_root
        self._one_to_one = one_to_one
        self._force_overwrite = force_overwrite
        # input path -> resolved output path
        self._input_to_output: Dict[Path, Path] = {}
        # output path -> currently open writer
        self._open_writers: Dict[Path, p5.Writer] = {}
        # output path -> whether it was closed because of an exception
        self._closed_writers: Dict[Path, bool] = {}

    @logged_all
    def _open_writer(self, output_path: Path) -> Optional[p5.Writer]:
        """
        Get the writer from existing handles or create a new one if unseen

        Returns None if the writer for output_path was previously closed due to an
        exception. Raises FileExistsError if it was previously closed cleanly.
        """
        if output_path in self._open_writers:
            return self._open_writers[output_path]

        if output_path in self._closed_writers:
            had_exception = self._closed_writers[output_path]
            if had_exception:
                return None
            raise FileExistsError(f"Trying to re-open a closed Writer to {output_path}")

        if output_path.exists() and self._force_overwrite:
            output_path.unlink()

        writer = p5.Writer(output_path)
        self._open_writers[output_path] = writer
        return writer

    @logged_all
    def get_writer(self, input_path: Path) -> Optional[p5.Writer]:
        """Get a Pod5Writer to write data from the input_path"""
        if input_path not in self._input_to_output:
            out_path = self.resolve_output_path(
                path=input_path, root=self.output_root, relative_root=self._one_to_one
            )
            self._input_to_output[input_path] = out_path

        output_path = self._input_to_output[input_path]
        return self._open_writer(output_path=output_path)

    @staticmethod
    @logged_all
    def resolve_one_to_one_path(path: Path, root: Path, relative_root: Path):
        """
        Find the relative path between the input path and the relative root

        Raises RuntimeError if path is not located under relative_root.
        """
        try:
            relative = path.with_suffix(".pod5").relative_to(relative_root)
        except ValueError as exc:
            raise RuntimeError(
                f"--one-to-one directory must be a relative parent of "
                f"all input fast5 files. For {path} relative to {relative_root}"
            ) from exc

        # Resolve the new final output path relative to the output directory
        # This path is to a file with the equivalent filename(.pod5)
        return root / relative

    @staticmethod
    @logged_all
    def resolve_output_path(
        path: Path, root: Path, relative_root: Optional[Path]
    ) -> Path:
        """
        Resolve the output path. If relative_root is a path, resolve the relative output
        path under root, otherwise, the output is either root or a new file within root
        if root is a directory
        """
        if relative_root is not None:
            # Resolve the relative path to the one_to_one root path
            out_path = OutputHandler.resolve_one_to_one_path(
                path=path,
                root=root,
                relative_root=relative_root,
            )

            # Create directory structure if needed
            out_path.parent.mkdir(parents=True, exist_ok=True)
            return out_path

        if root.is_dir():
            # If the output path is a directory, the write the default filename
            return root / "output.pod5"

        # The provided output path is assumed to be a named file
        return root

    @logged(log_args=True)
    def set_input_complete(self, input_path: Path, is_exception: bool) -> None:
        """
        Close the Pod5Writer for associated input_path

        Does nothing when not in one-to-one mode, when input_path has no resolved
        output, or when the writer for its output is not currently open.
        """
        if not self._one_to_one:
            # Do not close common output file when not in 1-2-1 mode
            return

        if input_path not in self._input_to_output:
            return

        output_path = self._input_to_output[input_path]
        writer = self._open_writers.get(output_path)
        if writer is None:
            # Already closed (or never opened, e.g. _open_writer returned None):
            # calling this again for the same input must not raise KeyError
            return

        writer.close()
        self._closed_writers[output_path] = is_exception
        del self._open_writers[output_path]

    @logged()
    def close_all(self):
        """Close all open writers"""
        for path, writer in self._open_writers.items():
            try:
                writer.close()
                # Keep track of closed writers to ensure we don't overwrite our own work
                self._closed_writers[path] = False
            except Exception as exc:
                logger.debug(f"Failed to cleanly close writer to {path} - {exc}")
        # Drop all writer references, including any which failed to close
        self._open_writers = {}


class StatusMonitor:
    """Tracks the progress of the conversion and reports it via a tqdm progress bar"""

    @logged_all
    def __init__(self, paths: Sequence[Path]):
        # The real read count of a file is only known once it has been converted,
        # so start from an estimate of 4k reads per fast5 file
        self.path_reads = dict.fromkeys(paths, 4000)
        self.count_finished = 0

        self.pbar = tqdm(
            total=self.total_reads,
            desc=f"Converting {self.total_files} Fast5s",
            unit="Reads",
            leave=True,
            **PBAR_DEFAULTS,
        )

    @property
    def total_files(self) -> int:
        """Number of input files being tracked"""
        return len(self.path_reads)

    @property
    def total_reads(self) -> int:
        """Sum of the (estimated or reported) read counts over all tracked files"""
        return sum(self.path_reads.values())

    @logged(log_args=True)
    def increment_reads(self, n: int) -> None:
        """Advance the progress bar by n reads"""
        self.pbar.update(n)

    @logged(log_args=True)
    def update_reads_total(self, path: Path, total: int) -> None:
        """Set the read count of path to total and refresh the progress bar total"""
        self.path_reads[path] = total
        self.pbar.total = self.total_reads
        self.pbar.refresh()

    @logged(log_args=True)
    def write(self, msg: str, file: Any) -> None:
        """Write a runtime message through tqdm to avoid clobbering the progress bar"""
        self.pbar.write(msg, file=file)

    @logged()
    def close(self) -> None:
        """Close the progress bar"""
        self.pbar.close()


@logged_all
def is_multi_read_fast5(path: Path) -> bool:
    """
    Check whether the given path points to a multi-read fast5 file for which
    direct-to-pod5 conversion is supported.

    Returns False, rather than raising, if the file cannot be opened or inspected.
    """
    try:
        # This is only a probe, so open explicitly read-only (as convert_fast5_file
        # does) rather than relying on the h5py default mode
        with h5py.File(str(path), "r") as _h5:
            # The "file_type" attribute might be present on supported multi-read
            # fast5 files. Depending on how it was stored it can be read back as
            # bytes, which would never compare equal to a python string.
            file_type = _h5.attrs.get("file_type")
            if isinstance(file_type, bytes):
                file_type = file_type.decode("utf-8", errors="replace")
            if file_type == "multi-read":
                return True

            # No keys, assume multi-read but there shouldn't be anything to do which
            # would cause an issue so pass silently
            if len(_h5) == 0:
                return True

            # If there are "read_x" keys, this is a multi-read file
            return any(key.startswith("read_") for key in _h5)

    except Exception:
        # Deliberate best-effort: anything which can't be inspected is reported as
        # "not a multi-read fast5" and the caller issues the error for the input
        return False


def decode_str(value: Union[str, bytes]) -> str:
    """Return value as a python string, decoding h5py byte strings as utf-8"""
    return value if isinstance(value, str) else value.decode("utf-8")


def convert_fast5_end_reason(fast5_end_reason: int) -> p5.EndReason:
    """
    Translate a fast5 end_reason integer into a pod5 EndReason.

    The fast5 enumeration has a "partial" value which pod5 does not, so the two
    enumerations are offset from each other. The returned EndReason uses the
    default "forced" value for the resolved reason.
    """
    # Expected fast5 enumeration:
    # end_reason_dict = {
    #     "unknown": 0,
    #     "partial": 1, <-- Not used in pod5
    #     "mux_change": 2,  <-- Remaining values are offset by +1
    #     "unblock_mux_change": 3,
    #     "data_service_unblock_mux_change": 4,
    #     "signal_positive": 5,
    #     "signal_negative": 6,
    # }
    reason = (
        # (0:unknown | 1:partial) => pod5 (0:unknown)
        p5.EndReasonEnum.UNKNOWN
        if fast5_end_reason < 2
        # Everything else sits one above its pod5 value
        else p5.EndReasonEnum(fast5_end_reason - 1)
    )
    return p5.EndReason.from_reason_with_default_forced(reason)


def convert_datetime_as_epoch_ms(
    time_str: Union[str, bytes, None],
) -> datetime.datetime:
    """
    Convert a fast5 time string to a datetime.

    Despite the function name, the result is a ``datetime.datetime`` and not a
    number of milliseconds. The timezone-aware unix epoch (UTC) is returned when
    time_str is None or cannot be parsed as an ISO 8601 date.
    """
    # Build the aware epoch directly: datetime.utcfromtimestamp is deprecated
    # since Python 3.12 and only ever produced a naive datetime
    epoch = datetime.datetime(1970, 1, 1, tzinfo=datetime.timezone.utc)
    if time_str is None:
        return epoch
    try:
        return iso8601.parse_date(decode_str(time_str))
    except iso8601.iso8601.ParseError:
        return epoch


def convert_run_info(
    acq_id: str,
    adc_max: int,
    adc_min: int,
    sample_rate: int,
    context_tags: Dict[str, Union[str, bytes]],
    device_type: str,
    tracking_id: Dict[str, Union[str, bytes]],
) -> p5.RunInfo:
    """
    Build a pod5 RunInfo from the run-level metadata parsed out of a fast5 read.

    Most fields are looked up in tracking_id and fall back to an empty string when
    missing. device_type is only used when tracking_id has no "device_type" entry.
    """

    def tracked(key: str, default: Union[str, bytes] = b"") -> str:
        """Decoded tracking_id value for key, or the decoded default if absent"""
        return decode_str(tracking_id.get(key, default))

    def decoded(tags: Dict[str, Union[str, bytes]]) -> Dict[str, str]:
        """Copy of tags with string keys and decoded values"""
        return {str(key): decode_str(value) for key, value in tags.items()}

    return p5.RunInfo(
        acquisition_id=acq_id,
        acquisition_start_time=convert_datetime_as_epoch_ms(
            tracking_id.get("exp_start_time")
        ),
        adc_max=adc_max,
        adc_min=adc_min,
        context_tags=decoded(context_tags),
        experiment_name="",
        flow_cell_id=tracked("flow_cell_id"),
        flow_cell_product_code=tracked("flow_cell_product_code"),
        protocol_name=tracked("exp_script_name"),
        protocol_run_id=tracked("protocol_run_id"),
        protocol_start_time=convert_datetime_as_epoch_ms(
            tracking_id.get("protocol_start_time", None)
        ),
        sample_id=tracked("sample_id"),
        sample_rate=sample_rate,
        sequencing_kit=decode_str(context_tags.get("sequencing_kit", b"")),
        sequencer_position=tracked("device_id"),
        sequencer_position_type=tracked("device_type", device_type),
        software="python-pod5-converter",
        system_name=tracked("host_product_serial_number"),
        system_type=tracked("host_product_code"),
        tracking_id=decoded(tracking_id),
    )


def convert_fast5_read(
    fast5_read: h5py.Group,
    run_info_cache: Dict[str, p5.RunInfo],
    signal_chunk_size: int = DEFAULT_SIGNAL_CHUNK_SIZE,
) -> p5.CompressedRead:
    """
    Build a pod5 CompressedRead from a single read group of a fast5 file.

    The RunInfo for the read's acquisition id is taken from run_info_cache, and is
    created and stored there first if this acquisition id has not been seen before.
    """
    channel_id = fast5_read["channel_id"]
    raw = fast5_read["Raw"]
    read_attrs = fast5_read.attrs

    # The acquisition id is the run_id, stored either on the read group itself or
    # on its tracking_id group
    if "run_id" in read_attrs:
        run_id_attrs = read_attrs
    else:
        run_id_attrs = fast5_read["tracking_id"].attrs
    acq_id = decode_str(run_id_attrs["run_id"])

    # Create new run_info if we've not seen this acquisition id before
    if acq_id not in run_info_cache:
        # The adc limits and device type are guessed from the digitisation
        if channel_id.attrs["digitisation"] == 8192:
            adc_min, adc_max, device_type_guess = -4096, 4095, "minion"
        else:
            adc_min, adc_max, device_type_guess = 0, 2047, "promethion"

        run_info_cache[acq_id] = convert_run_info(
            acq_id=acq_id,
            adc_max=adc_max,
            adc_min=adc_min,
            sample_rate=int(channel_id.attrs["sampling_rate"]),
            context_tags=dict(fast5_read["context_tags"].attrs),
            device_type=device_type_guess,
            tracking_id=dict(fast5_read["tracking_id"].attrs),
        )

    # Attributes unique to this read
    read_id = uuid.UUID(decode_str(raw.attrs["read_id"]))
    pore = p5.Pore(
        channel=int(channel_id.attrs["channel_number"]),
        well=raw.attrs["start_mux"],
        pore_type=decode_str(read_attrs.get("pore_type", b"not_set")),
    )
    calibration = p5.Calibration.from_range(
        offset=channel_id.attrs["offset"],
        adc_range=channel_id.attrs["range"],
        digitisation=channel_id.attrs["digitisation"],
    )
    end_reason = convert_fast5_end_reason(raw.attrs.get("end_reason", 0))

    # Load the whole signal and compress it in chunks
    signal_chunks, signal_chunk_lengths = vbz_compress_signal_chunked(
        raw["Signal"][()], signal_chunk_size
    )

    # Scaling values which are missing from the fast5 read default to NaN
    nan = float("nan")
    return p5.CompressedRead(
        read_id=read_id,
        pore=pore,
        calibration=calibration,
        read_number=raw.attrs["read_number"],
        start_sample=raw.attrs["start_time"],
        median_before=raw.attrs["median_before"],
        num_minknow_events=raw.attrs.get("num_minknow_events", 0),
        tracked_scaling=p5.pod5_types.ShiftScalePair(
            raw.attrs.get("tracked_scaling_shift", nan),
            raw.attrs.get("tracked_scaling_scale", nan),
        ),
        predicted_scaling=p5.pod5_types.ShiftScalePair(
            raw.attrs.get("predicted_scaling_shift", nan),
            raw.attrs.get("predicted_scaling_scale", nan),
        ),
        num_reads_since_mux_change=raw.attrs.get("num_reads_since_mux_change", 0),
        time_since_mux_change=raw.attrs.get("time_since_mux_change", 0.0),
        open_pore_level=nan,  # Not supported in fast5
        end_reason=end_reason,
        run_info=run_info_cache[acq_id],
        signal_chunks=signal_chunks,
        signal_chunk_lengths=signal_chunk_lengths,
    )


def get_read_from_fast5(group_name: str, h5_file: h5py.File) -> Optional[h5py.Group]:
    """
    Return the group called group_name from h5_file if its name marks it as a read
    ("read_" prefix). Returns None for any other name, or if the group can't be read.
    """
    if group_name.startswith("read_"):
        try:
            return h5_file[group_name]
        except KeyError as exc:
            # Observed strange behaviour where h5py reports a KeyError with
            # the message "Unable to open object". Report a failed read as warning
            warnings.warn(
                f"Failed to read key {group_name} from {h5_file.filename} : {exc}",
            )
    return None


def convert_fast5_file_chunk(
    queues: QueueManager,
    handle: h5py.File,
    chunk: Iterable[str],
    cache: Dict[str, p5.RunInfo],
    signal_chunk_size: int,
) -> List[CompressedRead]:
    """
    Convert the fast5 reads named in chunk, read from the open fast5 handle, into
    compressed pod5 reads. Names which don't yield a read are skipped.
    """
    # Allow request queue to throttle work
    queues.await_request()
    try:
        # Lazily fetched so that each read is converted right after it is loaded
        fast5_reads = (get_read_from_fast5(name, handle) for name in chunk)
        return [
            convert_fast5_read(fast5_read, cache, signal_chunk_size)
            for fast5_read in fast5_reads
            if fast5_read is not None
        ]
    except Exception as exc:
        # Ensures that requests aren't exhausted
        queues.enqueue_request()
        raise exc


@logged_all
def convert_fast5_file(
    path: Path,
    queues: QueueManager,
    signal_chunk_size: int = DEFAULT_SIGNAL_CHUNK_SIZE,
) -> int:
    """
    Convert the reads in the fast5 file at path, enqueueing each converted chunk
    of reads on queues. Returns the total number of reads converted.
    """
    # RunInfo instances are cached per file, keyed by acquisition id
    run_info_cache: Dict[str, p5.RunInfo] = {}
    converted: int = 0

    with h5py.File(str(path), "r") as _f5:
        # Work through the top-level keys READ_CHUNK_SIZE names at a time
        for names in more_itertools.chunked(_f5.keys(), READ_CHUNK_SIZE):
            reads = convert_fast5_file_chunk(
                queues=queues,
                handle=_f5,
                chunk=names,
                cache=run_info_cache,
                signal_chunk_size=signal_chunk_size,
            )
            queues.enqueue_data(path, reads)
            converted += len(reads)

    return converted


@logged()
def issue_not_multi_read_exception(path: Path, queues: QueueManager):
    """
    Report that path is not a multi-read fast5: log the problem, enqueue a
    TypeError for it and then enqueue the file end with zero reads.
    """
    logger.error(f"Input {path.name} is not a multi-read fast5")
    error = TypeError(f"{path} is not a multi-read fast5 file.")
    queues.enqueue_exception(path=path, exception=error, trace="")

    logger.info(f"Enqueueing file end: {path.name} reads: 0")
    queues.enqueue_data(path, 0)


@logged(log_time=True)
def convert_fast5_files(
    queues: QueueManager,
    signal_chunk_size: int = DEFAULT_SIGNAL_CHUNK_SIZE,
) -> None:
    """
    Worker loop converting the fast5 inputs available in queues.

    Converted reads, the per-file read totals and any exceptions are enqueued for
    handling elsewhere. Once the inputs run out a (None, None) sentinel is enqueued.
    """
    # get_input returning None marks the end of the inputs
    for path in iter(queues.get_input, None):
        if not is_multi_read_fast5(path):
            issue_not_multi_read_exception(path, queues)
            continue

        try:
            total_reads = convert_fast5_file(path, queues, signal_chunk_size)
            logger.info(f"Enqueueing file end: {path.name} reads: {total_reads}")
            queues.enqueue_data(path, total_reads)

        except Exception as exc:
            import traceback

            logger.error(f"Enqueueing exception: {path.name} {exc}")
            queues.enqueue_exception(path, exc, traceback.format_exc())

    logger.info("Inputs exhausted. Closing Process")
    logger.info("Enqueue sentinel")
    queues.enqueue_data(None, None)


@logged(log_args=True)
def handle_exception(
    exception: Tuple[Path, Exception, str],
    output_handler: OutputHandler,
    status: StatusMonitor,
    strict: bool,
) -> None:
    """
    Report an exception, given as a (path, exception, trace) tuple, and mark its
    input as complete. The exception is re-raised only if strict is set.
    """
    failed_path, error, trace = exception
    status.write(str(error), sys.stderr)
    output_handler.set_input_complete(failed_path, is_exception=True)

    if not strict:
        return

    # Strict mode: close the status output and abort with the original error
    status.close()
    logger.fatal("Exception raised and --strict set")
    logger.debug(f"trace: {trace}")
    raise error


@logged_all
def process_conversion_tasks(
    queues: QueueManager,
    output_handler: OutputHandler,
    status: StatusMonitor,
    strict: bool,
    threads: int = DEFAULT_THREADS,
) -> None:
    """
    Work through the queues of data until all work is done.

    Loops until an end sentinel (a None path) has been received `threads` times.
    Each item taken from the data queue is one of:
      - (None, _): end sentinel
      - (path, int): file finished, the int is its total read count
      - (path, reads): converted reads to write to the output for path

    Exceptions are polled before data on every iteration and passed to
    handle_exception, which re-raises them when strict is set.
    """

    count_complete_processes = 0
    while count_complete_processes < threads:
        # Always poll exceptions to ensure they're handled
        exception = queues.get_exception()
        if exception is not None:
            handle_exception(
                exception=exception,
                output_handler=output_handler,
                status=status,
                strict=strict,
            )
            continue

        path, data = queues.await_data()

        # Handle exhausted processes
        if path is None:
            # Processed finished sentinel
            count_complete_processes += 1
            logger.info(
                f"Got process end sentinel {count_complete_processes} of {threads}"
            )
            continue

        # Update the progress bar with the total number of converted reads in the file
        if isinstance(data, int):
            status.update_reads_total(path, data)
            output_handler.set_input_complete(path, is_exception=False)
            continue

        # Write the incoming list of converted reads
        writer = output_handler.get_writer(path)
        if writer is None:
            # logger.warning: "warn" is a deprecated alias
            logger.warning(
                f"Trying to write to {path} writer which was closed by an exception"
            )
        else:
            logger.info(f"Writing {len(data)} reads to {path.name} using {writer}")
            writer.add_reads(data)
            status.increment_reads(len(data))

    status.close()


@logged(log_time=True)
def convert_from_fast5(
    inputs: List[Path],
    output: Path,
    recursive: bool = False,
    threads: int = DEFAULT_THREADS,
    one_to_one: Optional[Path] = None,
    force_overwrite: bool = False,
    signal_chunk_size: int = DEFAULT_SIGNAL_CHUNK_SIZE,
    strict: bool = False,
) -> None:
    """
    Convert fast5 files found (optionally recursively) at the given input Paths
    into pod5 file(s). If one_to_one is a Path then the new pod5 files are
    created in a new relative directory structure within output relative to the
    one_to_one Path.

    Conversion runs in `threads` spawned worker processes (capped at the number of
    inputs found) while this process writes the converted reads.

    Raises:
        FileExistsError: output is an existing file and force_overwrite is not set
        RuntimeError: no *.fast5 files were found in inputs
        Exception: any error raised while processing the conversion tasks is
            re-raised after the worker processes have been terminated
    """

    if output.is_file() and not force_overwrite:
        raise FileExistsError(
            "Output path points to an existing file and --force-overwrite not set"
        )

    # Only create parent directories when output has more than one path component
    if len(output.parts) > 1:
        output.parent.mkdir(parents=True, exist_ok=True)

    threads = limit_threads(threads)

    pending_fast5s = collect_inputs(inputs, recursive, "*.fast5", threads=threads)
    if not pending_fast5s:
        logger.fatal(f"Found no *.fast5 files in inputs: {inputs}")
        raise RuntimeError("Found no fast5 inputs to process - Exiting")

    output_handler = OutputHandler(output, one_to_one, force_overwrite)
    status = StatusMonitor(pending_fast5s)

    # No point starting more workers than there are files to convert
    threads = min(threads, len(pending_fast5s))
    ctx = mp.get_context("spawn")
    queues = QueueManager(
        context=ctx,
        inputs=pending_fast5s,
        threads=threads,
        timeout=TIMEOUT_SECONDS,
    )

    # Start one daemon worker process per thread, each running convert_fast5_files
    active_processes = []
    for _ in range(threads):
        process = ctx.Process(
            target=convert_fast5_files,
            args=(queues, signal_chunk_size),
            daemon=True,
        )
        process.start()
        active_processes.append(process)

    try:
        # Returns once every worker has sent its end sentinel
        process_conversion_tasks(
            queues=queues,
            output_handler=output_handler,
            status=status,
            strict=strict,
            threads=threads,
        )

        queues.shutdown()
        for proc in active_processes:
            proc.join()
            proc.close()

    except Exception as exc:
        status.write(f"An unexpected error occurred: {exc}", file=sys.stderr)
        terminate_processes(active_processes)
        raise exc

    finally:
        # Always close the output writers, whether or not the conversion succeeded
        output_handler.close_all()
        logger.disabled = True


def main():
    """Command line entry point for pod5_convert_from_fast5"""
    parser = pod5_convert_from_fast5_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_convert_to_fast5.py
================================================
"""
Tool for converting pod5 files to the legacy fast5 format
"""

import time
from concurrent.futures import Future, ProcessPoolExecutor, as_completed
from pathlib import Path
from typing import Dict, List, Tuple

import h5py
import numpy
import vbz_h5py_plugin  # noqa: F401
from more_itertools import chunked

import pod5 as p5
from pod5.tools.parsers import pod5_convert_to_fast5_argparser, run_tool
from pod5.tools.utils import DEFAULT_THREADS, collect_inputs, limit_threads

# Mapping of end reason name to the integer value written to fast5 files.
# Pod5 does not have 'partial' so need to add that back in here.
FAST5_END_REASONS = {
    "unknown": 0,
    "partial": 1,  # Do not remove, required by fast5.
    "mux_change": 2,
    "unblock_mux_change": 3,
    "data_service_unblock_mux_change": 4,
    "signal_positive": 5,
    "signal_negative": 6,
    "api_request": 7,
    "device_data_error": 8,
    "analysis_config_change": 9,
    "paused": 10,
}

# Fast5 types
# Enum dtype built from the mapping above, used for the "end_reason" attribute
FAST5_END_REASON_TYPE = h5py.enum_dtype(FAST5_END_REASONS)
# ASCII string dtype used when creating string attributes
FAST5_STRING_TYPE = h5py.string_dtype("ascii")


class StatusMonitor:
    """Class for monitoring the status / progress of the conversion"""

    def __init__(self, file_count: int):
        # Minimum number of seconds between two unforced status prints
        self.update_interval = 10

        self.file_count = file_count
        self.files_started = 0
        self.files_ended = 0
        self.read_count = 0
        self.reads_processed = 0
        self.sample_count = 0

        self.time_start = self.time_last_update = time.time()

    @property
    def running(self) -> bool:
        """Return true if not all files have finished processing"""
        return self.files_ended < self.file_count

    def increment(
        self,
        *,
        files_started: int = 0,
        files_ended: int = 0,
        read_count: int = 0,
        reads_processed: int = 0,
        sample_count: int = 0,
    ) -> None:
        """Increment the status counters"""
        self.files_started += files_started
        self.files_ended += files_ended
        self.read_count += read_count
        self.reads_processed += reads_processed
        self.sample_count += sample_count

    @property
    def samples_mb(self) -> float:
        """Return the samples count in megabytes (two bytes per sample)"""
        return (self.sample_count * 2) / 1_000_000

    @property
    def time_elapsed(self) -> float:
        """Return the time in seconds between the start and the last status update"""
        return self.time_last_update - self.time_start

    @property
    def sample_rate(self) -> float:
        """
        Return the time averaged sample rate in MB/s, or 0.0 when no time has
        elapsed yet
        """
        elapsed = self.time_elapsed
        if elapsed <= 0:
            # No update has happened yet, or the clock did not advance between the
            # start and the update; avoid dividing by zero
            return 0.0
        return self.samples_mb / elapsed

    def print_status(self, force: bool = False):
        """Print the status if the update interval has passed or if forced"""
        now = time.time()

        if force or self.time_last_update + self.update_interval < now:
            self.time_last_update = now

            print(
                f"{self.reads_processed} reads,\t",
                f"{self.formatted_sample_count},\t",
                f"{self.files_ended}/{self.file_count} files,\t",
                f"{self.sample_rate:.1f} MB/s",
            )

    @property
    def formatted_sample_count(self) -> str:
        """Return the sample count as a string with leading Metric prefix if necessary"""
        units = [
            (1000000000000, "T"),
            (1000000000, "G"),
            (1000000, "M"),
            (1000, "K"),
        ]

        for div, unit in units:
            # Inclusive so that exactly 1000 samples is reported as "1.0 K"
            if self.sample_count >= div:
                return f"{self.sample_count/div:.1f} {unit}Samples"
        return f"{self.sample_count} Samples"


def write_pod5_record_to_fast5(read: p5.ReadRecord, fast5: h5py.File) -> None:
    """
    Write a single pod5 read record into the open fast5 file as a new
    "read_<read_id>" group holding tracking_id, context_tags, channel_id and Raw
    sub-groups.
    """
    run_info = read.run_info
    tracking_id = run_info.tracking_id

    read_group = fast5.create_group(f"read_{read.read_id}")
    for name, text in (
        ("run_id", tracking_id["run_id"]),
        ("pore_type", read.pore.pore_type),
    ):
        read_group.attrs.create(name, text.encode("ascii"), dtype=FAST5_STRING_TYPE)

    # Run-level tags are copied over as they are
    tracking_attrs = read_group.create_group("tracking_id").attrs
    for key, value in tracking_id.items():
        tracking_attrs[key] = value

    context_attrs = read_group.create_group("context_tags").attrs
    for key, value in run_info.context_tags.items():
        context_attrs[key] = value

    channel_attrs = read_group.create_group("channel_id").attrs
    digitisation = run_info.adc_max - run_info.adc_min + 1
    for name, value in (
        ("digitisation", digitisation),
        ("offset", read.calibration.offset),
        ("range", digitisation * read.calibration.scale),
        ("sampling_rate", run_info.sample_rate),
    ):
        channel_attrs.create(name, value, dtype=numpy.float64)
    channel_attrs["channel_number"] = str(read.pore.channel)

    raw_group = read_group.create_group("Raw")
    raw_group.create_dataset(
        "Signal",
        data=read.signal,
        dtype=numpy.int16,
        compression=32020,
        compression_opts=(0, 2, 1, 1),
    )
    raw_attrs = raw_group.attrs
    raw_attrs.create("start_time", read.start_sample, dtype=numpy.uint64)
    raw_attrs.create("duration", read.sample_count, dtype=numpy.uint32)
    raw_attrs.create("read_number", read.read_number, dtype=numpy.int32)
    raw_attrs.create("start_mux", read.pore.well, dtype=numpy.uint8)
    raw_attrs["read_id"] = str(read.read_id).encode("utf-8")
    raw_attrs.create("median_before", read.median_before, dtype=numpy.float64)

    # Lookup the fast5 enumeration values, which should include "partial: 1"
    # This will ensure that the enumeration is valid on a round-trip
    raw_attrs.create(
        "end_reason",
        FAST5_END_REASONS[read.end_reason.name],
        dtype=FAST5_END_REASON_TYPE,
    )

    raw_attrs.create("num_minknow_events", read.num_minknow_events, dtype=numpy.uint64)

    for name, value in (
        ("tracked_scaling_scale", read.tracked_scaling.scale),
        ("tracked_scaling_shift", read.tracked_scaling.shift),
        ("predicted_scaling_scale", read.predicted_scaling.scale),
        ("predicted_scaling_shift", read.predicted_scaling.shift),
    ):
        raw_attrs.create(name, value, dtype=numpy.float32)

    raw_attrs.create(
        "num_reads_since_mux_change",
        read.num_reads_since_mux_change,
        dtype=numpy.uint32,
    )
    raw_attrs.create(
        "time_since_mux_change",
        read.time_since_mux_change,
        dtype=numpy.float32,
    )
    # Note dropping the 'open_pore_level' attribute as it is not supported in fast5


def convert_pod5_to_fast5(
    source: Path, dest: Path, read_ids: List[str]
) -> Tuple[int, int]:
    """
    Write the selected read_ids from the source pod5 file into a new multi-read
    fast5 file at dest, replacing any existing file.

    Returns a tuple of (number of read ids requested, total samples written).
    """
    dest.parent.mkdir(parents=True, exist_ok=True)

    # Remove any previous output before writing the new file
    if dest.exists():
        dest.unlink()

    total_samples = 0

    with p5.Reader(source) as reader, h5py.File(dest, "w") as f5:
        # File level attributes of the fast5 file
        for attr_name, attr_value in (
            ("file_version", "3.0"),
            ("file_type", "multi-read"),
        ):
            f5.attrs.create(
                attr_name, attr_value.encode("ascii"), dtype=FAST5_STRING_TYPE
            )

        # Every requested read must exist in the source (missing_ok=False)
        selected_reads = reader.reads(
            selection=read_ids, missing_ok=False, preload={"samples"}
        )
        for read in selected_reads:
            write_pod5_record_to_fast5(read, f5)
            total_samples += read.num_samples

    return (len(read_ids), total_samples)


def convert_to_fast5(
    inputs: List[Path],
    output: Path,
    recursive: bool = False,
    threads: int = DEFAULT_THREADS,
    force_overwrite: bool = False,
    file_read_count: int = 4000,
):
    """
    Convert the pod5 files found at inputs into multi-read fast5 files written to
    the output directory.

    Each input is split into chunks of at most file_read_count reads and each chunk
    becomes one fast5 file named "<source stem>.<chunk index>_<input index>.fast5".
    The chunks are converted in a pool of `threads` processes.

    Raises:
        FileExistsError: output exists and is not a directory, or a destination
            fast5 file already exists and force_overwrite is not set
    """
    if output.exists() and not output.is_dir():
        raise FileExistsError("Cannot output to a file")

    threads = limit_threads(threads)

    with ProcessPoolExecutor(max_workers=threads) as executor:
        total_reads = 0
        futures: Dict[Future, Path] = {}

        # Enumerate over input pod5 files
        for input_idx, source in enumerate(
            collect_inputs(inputs, recursive, "*.pod5", threads=threads)
        ):
            # Open the inputs to read the read ids
            with p5.Reader(source) as reader:
                for chunk_idx, read_ids in enumerate(
                    chunked(reader.read_ids, file_read_count)
                ):
                    dest = (
                        output / f"{source.stem}.{chunk_idx}_{input_idx}.fast5"
                    ).resolve()

                    if dest.exists() and not force_overwrite:
                        raise FileExistsError(
                            "Output path points to an existing file and --force-overwrite not set"
                        )

                    kwargs = {
                        "source": source,
                        "dest": dest,
                        "read_ids": read_ids,
                    }
                    futures[executor.submit(convert_pod5_to_fast5, **kwargs)] = dest  # type: ignore

                total_reads += len(reader.read_ids)

        print(f"Converting pod5s into {len(futures)} fast5 files. Please wait...")

        # Progress is counted per output fast5 file (one future each), so the
        # monitor must be sized by the number of futures. The number of input
        # paths differs whenever an input is a directory or is split into chunks.
        status = StatusMonitor(file_count=len(futures))
        status.increment(files_started=len(futures), read_count=total_reads)

        for future in as_completed(futures):
            (reads_converted, samples_converted) = future.result()

            status.increment(
                files_ended=1,
                sample_count=samples_converted,
                reads_processed=reads_converted,
            )
            status.print_status()

        status.print_status(force=True)

        print("Conversion complete")


def main():
    """Command line entry point for pod5_convert_to_fast5"""
    parser = pod5_convert_to_fast5_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_filter.py
================================================
"""
Tool for subsetting pod5 files into one or more outputs using a list of read ids
"""

from pathlib import Path
from typing import List

import lib_pod5 as p5b
import polars as pl

from pod5.tools.parsers import prepare_pod5_filter_argparser, run_tool
from pod5.tools.pod5_subset import build_targets_dict
from pod5.tools.polars_utils import PL_DEST_FNAME, PL_READ_ID, PL_UUID_REGEX
from pod5.tools.utils import (
    DEFAULT_THREADS,
    collect_inputs,
    init_logging,
    limit_threads,
    logged_all,
)

# Module level logger
logger = init_logging()

# NOTE(review): presumably enabled so that Categorical values created in separate
# frames (see the PL_DEST_FNAME cast in parse_read_id_targets) stay compatible
# with each other - confirm
pl.enable_string_cache()


@logged_all
def parse_read_id_targets(ids: Path, output: Path) -> pl.LazyFrame:
    """
    Parse the list of read_ids in the ids file, keeping only valid uuids.

    Returns a LazyFrame with a PL_READ_ID column of unique read ids and a
    PL_DEST_FNAME column holding the resolved output path for every row.

    Raises:
        AssertionError: no valid read ids were found in ids
    """
    read_ids = (
        pl.scan_csv(
            ids,
            has_header=False,  # Any header will be filtered out by is_uuid
            comment_prefix="#",
            new_columns=[PL_READ_ID],
            rechunk=False,
        )
        .drop_nulls()
        .unique()
        .with_columns(
            [
                pl.lit(str(output.resolve())).cast(pl.Categorical).alias(PL_DEST_FNAME),
                pl.col(PL_READ_ID).str.contains(PL_UUID_REGEX).alias("is_uuid"),
            ]
        )
        .filter(pl.col("is_uuid"))
        .drop("is_uuid")
    )

    # Check for at least one valid read id on the real query result. LazyFrame.fetch
    # is a debugging helper which limits the rows read by the scan *before* the
    # filter is applied, so it can report zero rows for a file with valid read ids
    # further down.
    if len(read_ids.head(1).collect()) == 0:
        raise AssertionError(f"Found 0 read_ids in {ids}. Nothing to do")

    return read_ids


@logged_all
def filter_pod5(
    inputs: List[Path],
    output: Path,
    ids: Path,
    missing_ok: bool = False,
    force_overwrite: bool = False,
    recursive: bool = False,
    threads: int = DEFAULT_THREADS,
) -> int:
    """
    Build the read_id to output mapping from the ids file and subset the input
    pod5 files into output.

    Returns 0 on success, or 1 if stopped by a keyboard interrupt.

    Raises:
        FileExistsError: output already exists and force_overwrite is not set
    """
    # An existing output is only ever replaced on request
    if output.exists():
        if force_overwrite:
            output.unlink()
        else:
            raise FileExistsError(
                f"Output file already exists and --force-overwrite not set - {output}"
            )

    # Create parent directories if they do not exist
    parent_dir = output.parent
    if not parent_dir.exists():
        parent_dir.mkdir(parents=True, exist_ok=True)

    targets = parse_read_id_targets(ids, output=output)
    print(f"Parsed {len(targets.collect())} reads_ids from: {ids.name}")

    threads = limit_threads(threads)
    _inputs = collect_inputs(inputs, recursive, "*.pod5", threads=threads)
    targets_dict = build_targets_dict(targets)

    try:
        p5b.subset_pod5s_with_mapping(
            list(_inputs),
            output,
            targets_dict,
            # threads=threads,
            missing_ok,
            False,
            force_overwrite,
        )
    except KeyboardInterrupt:
        print("Stopped POD5 filter following keyboard interrupt.")
        return 1
    else:
        return 0


@logged_all
def main():
    """Command line entry point for pod5 filter"""
    parser = prepare_pod5_filter_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_inspect.py
================================================
"""
Tool for inspecting the contents of pod5 files
"""

import csv
import os
import sys
from dataclasses import asdict
from pathlib import Path
from typing import Callable, Dict, List
from uuid import UUID

import pod5 as p5
from pod5.tools.parsers import prepare_pod5_inspect_argparser, run_tool
from pod5.tools.utils import collect_inputs


def format_shift_scale_pair(pair):
    """Format a shift / scale pair as "(<shift> <scale>)" """
    return "({} {})".format(pair.shift, pair.scale)


def format_shift_scale_pair_num(pair):
    """Format a numeric shift / scale pair as "(<shift> <scale>)" with one decimal place"""
    return "({:.1f} {:.1f})".format(pair.shift, pair.scale)


def do_reads_command(reader: p5.Reader, write_header: bool):
    """
    Write one csv row per read in reader to stdout.

    The csv header is only written when write_header is set. Writing stops quietly
    if stdout is closed by the consumer (broken pipe).
    """
    keys = [
        "read_id",
        "channel",
        "well",
        "pore_type",
        "read_number",
        "start_sample",
        "end_reason",
        "median_before",
        "num_samples",
        "byte_count",
        "signal_compression_ratio",
        "num_minknow_events",
        "tracked_scaling",
        "predicted_scaling",
        "num_reads_since_mux_change",
        "time_since_mux_change",
        "open_pore_level",
    ]

    csv_read_writer = csv.DictWriter(sys.stdout, keys)

    # Only write header on first call
    if write_header:
        csv_read_writer.writeheader()

    for read in reader.reads():
        # Stored bytes relative to two bytes per sample. A read with no samples has
        # no meaningful ratio, so report nan instead of dividing by zero.
        uncompressed_bytes = read.sample_count * 2
        if uncompressed_bytes:
            compression_ratio = read.byte_count / float(uncompressed_bytes)
        else:
            compression_ratio = float("nan")

        fields = {
            "read_id": read.read_id,
            "channel": read.pore.channel,
            "well": read.pore.well,
            "pore_type": read.pore.pore_type,
            "read_number": read.read_number,
            "start_sample": read.start_sample,
            "end_reason": read.end_reason.name,
            "median_before": f"{read.median_before:.1f}",
            "num_samples": read.num_samples,
            "byte_count": read.byte_count,
            "signal_compression_ratio": f"{compression_ratio:.3f}",
            "num_minknow_events": read.num_minknow_events,
            "tracked_scaling": format_shift_scale_pair_num(read.tracked_scaling),
            "predicted_scaling": format_shift_scale_pair_num(read.predicted_scaling),
            "num_reads_since_mux_change": read.num_reads_since_mux_change,
            "time_since_mux_change": read.time_since_mux_change,
            "open_pore_level": read.open_pore_level,
        }

        try:
            csv_read_writer.writerow(fields)
        except BrokenPipeError:
            # The consumer closed the pipe (e.g. `| head`): point stdout at devnull
            # so that nothing else fails on write, then stop
            devnull = os.open(os.devnull, os.O_WRONLY)
            os.dup2(devnull, sys.stdout.fileno())
            break


def dump_run_info(run_info: p5.RunInfo):
    """Print each run info field on its own tab-indented line"""
    indent = "\t"
    nested_indent = indent * 2
    for field_name, field_value in asdict(run_info).items():
        if not isinstance(field_value, list):
            print(f"{indent}{field_name}: {field_value}")
            continue

        # List-valued fields are unpacked as (key, value) pairs and printed
        # one level deeper under the field name
        print(f"{indent}{field_name}:")
        for key, item in field_value:
            print(f"{nested_indent}{key}: {item}")


def do_read_command(reader: p5.Reader, read_id: str, **_):
    """
    Print the details of the single read whose id matches `read_id`.

    `read_id` must parse as a UUID; otherwise a message is written to stderr
    and nothing else happens. Nothing is printed when the reader does not
    contain the read. Extra keyword arguments are ignored.

    A read with no samples reports its compression ratio as "nan" instead of
    raising ZeroDivisionError.
    """
    try:
        uuid_read_id = UUID(read_id)

    except ValueError:
        print(f"Supplied read_id '{read_id}' is not a valid UUID", file=sys.stderr)
        return

    for read in reader.reads():
        if read.read_id != uuid_read_id:
            continue

        print(f"read_id: {read.read_id}")
        print(f"read_number:\t{read.read_number}")
        print(f"start_sample:\t{read.start_sample}")
        print(f"median_before:\t{read.median_before}")
        print(f"open_pore_level:\t{read.open_pore_level}")
        print("channel data:")
        print(f"\tchannel: {read.pore.channel}")
        print(f"\twell: {read.pore.well}")
        print(f"\tpore_type: {read.pore.pore_type}")
        print("end reason:")
        print(f"\tname: {read.end_reason.name}")
        print(f"\tforced: {read.end_reason.forced}")
        print("calibration:")
        print(f"\toffset: {read.calibration.offset}")
        print(f"\tscale: {read.calibration.scale}")
        print("samples:")
        sample_count = read.sample_count
        print(f"\tsample_count: {sample_count}")
        print(f"\tbyte_count: {read.byte_count}")

        # The ratio is stored bytes over (sample_count * 2); it is undefined
        # for a read without samples.
        if sample_count:
            compression_ratio = read.byte_count / float(sample_count * 2)
        else:
            compression_ratio = float("nan")
        print(f"\tcompression ratio: {compression_ratio:.3f}")

        print("run info:")
        dump_run_info(read.run_info)
        # Only the first matching read is reported
        break


def do_debug_command(reader: p5.Reader, **_):
    """
    Print aggregate statistics for the file behind `reader`.

    Reports the number of reads per batch, the sample span covered by the
    reads, the total samples and stored bytes with the resulting compression
    ratio, and every distinct run info referenced by the reads. Extra keyword
    arguments are ignored.

    A file without reads skips the sample span line, and a file without any
    samples reports the ratio as "nan" instead of raising ZeroDivisionError.
    """
    batch_sizes = []
    sample_count = 0
    byte_count = 0
    min_sample = float("inf")
    max_sample = 0

    # Distinct run infos keyed by their index, in order of first appearance
    run_infos = {}

    for batch in reader.read_batches():
        batch_read_count = 0
        for read in batch.reads():
            batch_read_count += 1
            read_sample_count = read.sample_count
            sample_count += read_sample_count
            byte_count += read.byte_count

            run_info_index = read.run_info_index
            if run_info_index not in run_infos:
                run_infos[run_info_index] = read.run_info

            min_sample = min(min_sample, read.start_sample)
            max_sample = max(max_sample, read.start_sample + read_sample_count)
        batch_sizes.append(batch_read_count)

    batch_count = len(batch_sizes)
    read_count = sum(batch_sizes)

    print(f"Contains {read_count} reads, in {batch_count} batches: {batch_sizes}")

    # Without reads the span would print the untouched "inf"/0 sentinels
    if read_count:
        print(f"Reads span from sample {min_sample} to {max_sample}")

    # The ratio is stored bytes over (sample_count * 2), as a percentage
    if sample_count:
        ratio_percent = 100 * byte_count / float(sample_count * 2)
    else:
        ratio_percent = float("nan")
    print(
        f"{sample_count} samples, {byte_count}"
        f" bytes: {ratio_percent:.1f} % signal compression ratio"
    )

    for idx, run_info in run_infos.items():
        print(f"Run info {idx}:")
        dump_run_info(run_info)


def do_summary_command(reader: p5.Reader, **kwargs):
    """
    Print the file versions, whether the signal is VBZ compressed, and the
    number of reads in each batch followed by the totals
    """
    print(
        f"Originating file version {reader.file_version}, in memory read table version {reader.reads_table_version}."
    )
    print(f"File version on disk {reader.file_version_pre_migration}.")

    compression_message = (
        "File uses VBZ compression."
        if reader.is_vbz_compressed
        else "File is uncompressed."
    )
    print(compression_message)

    n_batches = 0
    n_reads = 0
    # Batches are reported 1-indexed
    for n_batches, batch in enumerate(reader.read_batches(), start=1):
        reads_in_batch = sum(1 for _ in batch.reads())
        print(f"Batch {n_batches}, {reads_in_batch} reads")
        n_reads += reads_in_batch

    print(f"Found {n_batches} batches, {n_reads} reads")


def inspect_pod5(
    command: str, input_files: List[Path], recursive: bool = False, **kwargs
):
    """
    Determine which inspect command to run from the parsed arguments and run it
    on every collected input file.

    Files which fail to open are reported on stderr and skipped. Each reader is
    closed once its command has run. `write_header` is passed as True only for
    the first file that opens successfully, so the header is still written when
    the first collected file turns out to be unreadable.

    Raises KeyError if `command` is not a known inspect command.
    """

    commands: Dict[str, Callable] = {
        "reads": do_reads_command,
        "read": do_read_command,
        "summary": do_summary_command,
        "debug": do_debug_command,
    }

    header_pending = True
    for filename in collect_inputs(
        input_files, recursive=recursive, pattern="*.pod5"
    ):
        try:
            reader = p5.Reader(filename)
        except Exception as exc:
            print(f"Failed to open pod5 file: {filename}: {exc}", file=sys.stderr)
            continue

        # Use the reader as a context manager so its file handles are released
        # before the next file is opened
        with reader:
            kwargs["reader"] = reader
            kwargs["write_header"] = header_pending
            header_pending = False
            commands[command](**kwargs)


def main():
    """Entry point: build the pod5 inspect argument parser and hand it to run_tool"""
    parser = prepare_pod5_inspect_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_merge.py
================================================
"""
Tool for merging pod5 files
"""

from time import sleep
from typing import Iterable
from pathlib import Path
from tqdm.auto import tqdm

import pod5 as p5
import pod5.repack as p5_repack
from pod5.tools.parsers import prepare_pod5_merge_argparser, run_tool
from pod5.tools.utils import (
    DEFAULT_THREADS,
    PBAR_DEFAULTS,
    collect_inputs,
    init_logging,
    logged_all,
)

logger = init_logging()


@logged_all
def merge_pod5(
    inputs: Iterable[Path],
    output: Path,
    force_overwrite: bool = False,
    recursive: bool = False,
    threads: int = DEFAULT_THREADS,
    readers: int = 5,
) -> None:
    """
    Merge an iterable of input pod5 paths into the specified output path.

    An existing output is removed when `force_overwrite` is set, otherwise
    FileExistsError is raised. The parent directory of `output` is created if
    missing. `readers` limits how many inputs the repacker may have open at
    once (values below 1 are treated as 1). `recursive` and `threads` are
    forwarded to `collect_inputs`.
    """

    # Never replace an existing output unless explicitly asked to
    if output.exists():
        if force_overwrite:
            output.unlink()
        else:
            raise FileExistsError(
                f"Output files already exists and --force-overwrite not set. "
                f"Refusing to overwrite {output}."
            )

    if not output.parent.exists():
        output.parent.mkdir(parents=True, exist_ok=True)

    _inputs = collect_inputs(
        inputs, recursive=recursive, pattern="*.pod5", threads=threads
    )

    print(f"Merging reads from {len(_inputs)} files")
    logger.debug(f"Merging reads from {len(_inputs)} files into {output.absolute()}")

    # Open the output file writer
    with p5.Writer(output.absolute()) as writer:
        # Attach the writer to the repacker
        # NOTE(review): the meaning of the second positional argument to
        # add_output is not visible from here - confirm against the Repacker API
        repacker = p5_repack.Repacker()
        repacker_output = repacker.add_output(writer, True)

        pbar = tqdm(
            total=len(_inputs),
            desc="Merging",
            unit="File",
            leave=True,
            position=0,
            **PBAR_DEFAULTS,
        )

        # Always allow at least one reader, whatever value was requested
        active_limit = max(readers, 1)
        logger.debug(f"{active_limit=}")

        opened_readers = 0
        active = 0
        while _inputs or active > 0:
            # Move the bar to (opened - still open), using the open-reader count
            # sampled on the previous pass
            pbar.update(opened_readers - active - pbar.n)

            active = repacker.currently_open_file_reader_count
            if _inputs and (active < active_limit):
                next_input = _inputs.pop()
                logger.debug(f"submitting: {next_input=}")
                with p5.Reader(next_input) as reader:
                    opened_readers += 1
                    repacker.add_all_reads_to_output(repacker_output, reader)
                    # Loop again straight away to fill any remaining reader slots
                    continue

            # Every input has been submitted: mark the output finished and stop
            # polling
            if not _inputs:
                logger.debug("no inputs remaining - finishing")
                repacker.set_output_finished(repacker_output)
                break

            # Reader limit reached with inputs still pending: wait before
            # sampling the open-reader count again
            sleep(0.2)
            logger.debug(f"{len(_inputs)=}, {active=}, {(active > 0)=}")

        repacker.finish()
        del repacker
        pbar.update(opened_readers - active - pbar.n)
        pbar.close()

    return


def main():
    """Entry point: build the pod5 merge argument parser and hand it to run_tool"""
    parser = prepare_pod5_merge_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_recover.py
================================================
"""
Tool for recovering truncated pod5 files
"""

import dataclasses
import typing
from contextlib import suppress
from pathlib import Path

import lib_pod5 as p5b
import pod5 as p5
from pod5.tools.parsers import prepare_pod5_recover_argparser, run_tool
from pod5.tools.utils import collect_inputs


@dataclasses.dataclass
class RecoveredData:
    """
    Running totals accumulated across all files passed through recovery.
    """

    # Signal table rows recovered
    signal_rows: int = 0
    # Read table rows recovered
    reads: int = 0
    # Run info table rows recovered
    run_infos: int = 0
    # Files whose recovery raised an error
    files_with_errors: int = 0


def is_file_ok(path: Path) -> bool:
    """Return True if `path` can be opened by the pod5 Reader without a RuntimeError"""
    readable = True
    try:
        # Opening (and closing) the file is the whole check
        with p5.Reader(path):
            pass
    except RuntimeError:
        readable = False
    return readable


def recover_pod5(
    inputs: typing.List[Path], force_overwrite: bool, recursive: bool, cleanup: bool
):
    """
    Recover the data of every input file that cannot be opened normally.

    Each recovered file is written next to its source as
    "<stem>_recovered.pod5". Existing outputs are removed when
    `force_overwrite` is set, otherwise FileExistsError is raised before any
    recovery starts. A per-file result and a final summary are printed.
    """
    suffix = "_recovered.pod5"

    candidates = collect_inputs(
        inputs, recursive=recursive, pattern=["*.tmp", "*.pod5"]
    )
    broken = [candidate for candidate in candidates if not is_file_ok(candidate)]

    if not broken:
        print(f"None of the {len(candidates)} files given need recovery")
        return

    # Clear the way for every output before recovering anything
    for src in broken:
        target = src.parent / (src.stem + suffix)
        if not target.exists():
            continue
        if not force_overwrite:
            raise FileExistsError(
                f"Output files already exists and --force-overwrite not set. "
                f"Refusing to overwrite {target}."
            )
        target.unlink()

    totals = RecoveredData()
    recover_options = p5b.RecoverFileOptions()
    recover_options.cleanup = cleanup

    for src in broken:
        target = src.parent / (src.stem + suffix)
        try:
            outcome = p5b.recover_file(
                str(src.resolve()), str(target.resolve()), recover_options
            )
            totals.signal_rows += outcome.row_counts.signal
            totals.run_infos += outcome.row_counts.run_info
            totals.reads += outcome.row_counts.reads
            print(f"{target} - Recovered")
            for failure in outcome.cleanup_errors:
                print(
                    "Warning cleanup failed to cleanup file "
                    f"'{failure.file_path}' due to : {failure.description}"
                )
        except RuntimeError as error:
            totals.files_with_errors += 1
            print(f"{target} - Recovery failed - {error!s}")
            # Remove whatever partial output the failed attempt left behind
            with suppress(FileNotFoundError):
                target.unlink()

    print(
        f"Recovered {totals.signal_rows} signal rows, "
        f"{totals.reads} reads, "
        f"{totals.run_infos} run infos, "
        f"{totals.files_with_errors} files with errors"
    )


def main():
    """Entry point: build the pod5 recover argument parser and hand it to run_tool"""
    parser = prepare_pod5_recover_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_repack.py
================================================
"""
Tool for repacking pod5 files to potentially improve performance
"""

from concurrent.futures import ProcessPoolExecutor, as_completed
import typing
from pathlib import Path
from tqdm.auto import tqdm

import pod5 as p5
import pod5.repack
from pod5.tools.utils import (
    DEFAULT_THREADS,
    PBAR_DEFAULTS,
    assert_no_duplicate_filenames,
    collect_inputs,
    limit_threads,
)
from pod5.tools.parsers import prepare_pod5_repack_argparser, run_tool


def resolve_overwrite(src: Path, dest: Path, force: bool) -> None:
    """
    Make sure `dest` is free to be written, removing it when `force` is set.

    Does nothing if `dest` does not exist.

    Raises FileExistsError if `dest` refers to the same file as `src`, or if
    `dest` exists and `force` is not set.
    """
    if not dest.exists():
        return

    # Compare resolved paths as well: a relative path, a ".." segment or a
    # symlink can spell the source differently, and unlinking it under
    # --force-overwrite would destroy the input.
    if dest == src or dest.resolve() == src.resolve():
        raise FileExistsError(f"Refusing to overwrite {src} inplace")

    if not force:
        raise FileExistsError("Refusing to overwrite output without --force-overwrite")

    dest.unlink()


def repack_pod5_file(src: Path, dest: Path):
    """Write every read of the pod5 file `src` into a new pod5 file at `dest`"""
    packer = pod5.repack.Repacker()
    with p5.Writer(dest) as out_writer:
        out_handle = packer.add_output(out_writer, False)

        # Queue all reads of the source for the single output
        with p5.Reader(src) as in_reader:
            packer.add_all_reads_to_output(out_handle, in_reader)

        # Nothing more will be added; complete the repack before the writer
        # is closed
        packer.set_output_finished(out_handle)
        packer.finish()


def repack_pod5(
    inputs: typing.List[Path],
    output: Path,
    threads: int = DEFAULT_THREADS,
    force_overwrite: bool = False,
    recursive: bool = False,
):
    """
    Given a list of pod5 files, repack their contents and write files 1-1
    into the `output` directory, one worker process per file.

    Raises ValueError if `output` is an existing file, FileExistsError if an
    output would replace an input or an existing file without
    `force_overwrite`, and RuntimeError once all work has completed if any
    file failed to repack.
    """

    if output.exists() and not output.is_dir():
        raise ValueError(f"Output cannot be an existing file: {output}")

    # Create output directory if required
    if not output.is_dir():
        output.mkdir(parents=True, exist_ok=True)

    threads = limit_threads(threads)

    _inputs = collect_inputs(
        inputs, recursive=recursive, pattern="*.pod5", threads=threads
    )
    assert_no_duplicate_filenames(_inputs)

    # Remove existing files if required
    for input_filename in _inputs:
        output_filename = output / input_filename.name
        resolve_overwrite(input_filename, output_filename, force_overwrite)

    futures = {}
    failed = []
    with ProcessPoolExecutor(max_workers=threads) as executor:
        with tqdm(total=len(_inputs), unit="Files", **PBAR_DEFAULTS) as pbar:
            for src in _inputs:
                dest = output / src.name
                futures[executor.submit(repack_pod5_file, src=src, dest=dest)] = dest

            for future in as_completed(futures):
                dest = futures[future]
                # An exception raised in the worker is only visible through the
                # future; without this check a failed file would be reported as
                # finished.
                error = future.exception()
                if error is None:
                    tqdm.write(f"Finished {dest}")
                else:
                    failed.append(dest)
                    tqdm.write(f"Failed {dest}: {error}")
                pbar.update(1)

    if failed:
        raise RuntimeError(
            f"Failed to repack {len(failed)} of {len(futures)} files: "
            f"{[str(path) for path in failed]}"
        )

    print("Done")


def main():
    """Entry point: build the pod5 repack argument parser and hand it to run_tool"""
    parser = prepare_pod5_repack_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_subset.py
================================================
"""
Tool for subsetting pod5 files into one or more outputs
"""

from collections import defaultdict
from copy import deepcopy
from pathlib import Path
from string import Formatter
from typing import List, Optional, Tuple

import lib_pod5 as p5b
import polars as pl

from pod5.tools.parsers import prepare_pod5_subset_argparser, run_tool
from pod5.tools.polars_utils import (
    PL_DEST_FNAME,
    PL_READ_ID,
    PL_UUID_REGEX,
)
from pod5.tools.utils import (
    DEFAULT_THREADS,
    collect_inputs,
    init_logging,
    logged,
    logged_all,
)

DEFAULT_READ_ID_COLUMN = "read_id"

logger = init_logging()

pl.enable_string_cache()


@logged_all
def get_separator(path: Path) -> str:
    """
    Guess the field separator of the file at path from its first line by
    counting tabs and commas. Returns "," only when commas outnumber tabs,
    otherwise "<tab>" (including ties and lines containing neither)
    """
    with path.open("r") as handle:
        first_line = handle.readline()

    comma_count = first_line.count(",")
    tab_count = first_line.count("\t")
    return "," if comma_count > tab_count else "\t"


@logged_all
def default_filename_template(subset_columns: List[str]) -> str:
    """
    Build the default output filename template: one "<col>-{<col>}" part per
    subset column, joined with "_" and ending in ".pod5"
    """
    parts = ["{0}-{{{0}}}".format(col) for col in subset_columns]
    return "_".join(parts) + ".pod5"


@logged_all
def column_keys_from_template(template: str) -> List[str]:
    """Return the non-empty placeholder names found in the template, in order"""
    keys: List[str] = []
    for _literal, field_name, _spec, _conversion in Formatter().parse(template):
        if field_name:
            keys.append(field_name)
    return keys


@logged_all
def fstring_to_polars(
    template: str,
) -> Tuple[str, List[str]]:
    """
    Convert named "{key}" placeholders into the positional "{}" form used by
    pl.format. Returns the converted template together with the keys in the
    order they appear
    """
    keys = column_keys_from_template(template)
    positional = template
    for name in keys:
        positional = positional.replace("{" + name + "}", "{}")
    return positional, keys


@logged_all
def parse_table_mapping(
    summary_path: Path,
    filename_template: Optional[str],
    subset_columns: List[str],
    read_id_column: str = DEFAULT_READ_ID_COLUMN,
    ignore_incomplete_template: bool = False,
) -> pl.LazyFrame:
    """
    Read a summary table with polars and derive, for each row holding a valid
    read id, the output filename produced by the filename template
    """
    if not subset_columns:
        raise AssertionError("Missing --columns when using --summary / --table")

    # Fall back to the template derived from the subset columns
    template = filename_template or default_filename_template(subset_columns)
    assert_filename_template(template, subset_columns, ignore_incomplete_template)

    # pl.format takes positional placeholders plus the columns to fill them
    pl_template, keys = fstring_to_polars(template)

    # Only the subset columns and the read id column are loaded
    wanted_columns = [*deepcopy(subset_columns), read_id_column]

    table = pl.read_csv(
        summary_path,
        columns=wanted_columns,
        separator=get_separator(summary_path),
        comment_prefix="#",
    )

    with_targets = table.lazy().with_columns(
        [
            pl.format(pl_template, *keys).cast(pl.Categorical).alias(PL_DEST_FNAME),
            pl.col(read_id_column).alias(PL_READ_ID),
        ]
    )

    # Keep only rows whose read id matches the UUID pattern
    flagged = with_targets.with_columns(
        [
            pl.col(PL_READ_ID).str.contains(PL_UUID_REGEX).alias("is_uuid"),
        ]
    )
    return flagged.filter(pl.col("is_uuid")).drop("is_uuid")


@logged_all
def assert_filename_template(
    template: str, subset_columns: List[str], ignore_incomplete_template: bool
) -> None:
    """
    Check the template placeholders against subset_columns. Raises KeyError
    for a placeholder that is not a subset column and, unless
    ignore_incomplete_template is set, for a subset column without a placeholder
    """
    # "{hello}_world_{name}" -> {"hello", "name"}
    template_keys = set(
        field_name for _, field_name, _, _ in Formatter().parse(template) if field_name
    )
    allowed_keys = set(subset_columns)

    unexpected = template_keys.difference(allowed_keys)
    if unexpected:
        raise KeyError(f"--template {template} has unexpected keys: {unexpected}")

    if ignore_incomplete_template:
        return

    # A subset column missing from the template would make the output
    # degenerate on that key
    unused = allowed_keys.difference(template_keys)
    if unused:
        raise KeyError(
            f"--template {template} does not use {unused} keys. "
            "Use --ignore-incomplete-template to suppress this exception."
        )


@logged_all
def create_default_filename_template(subset_columns: List[str]) -> str:
    """
    Build the default filename template from the subset columns:
    "<col>-{<col>}" parts joined with "_" followed by ".pod5"
    """
    pieces = []
    for col in subset_columns:
        pieces.append("{name}-{{{name}}}".format(name=col))
    template = "_".join(pieces)
    return template + ".pod5"


@logged_all
def parse_csv_mapping(csv_path: Path) -> pl.LazyFrame:
    """
    Scan a header-less csv of (output target, read_id) rows into a targets
    LazyFrame, keeping only rows whose read id matches the UUID pattern.
    Raises AssertionError if a 10 row preview yields no read ids
    """
    scanned = pl.scan_csv(
        csv_path,
        has_header=False,
        comment_prefix="#",
        new_columns=[PL_DEST_FNAME, PL_READ_ID],
        rechunk=False,
    )

    flagged = scanned.drop_nulls().with_columns(
        [
            pl.col(PL_DEST_FNAME).cast(pl.Categorical),
            pl.col(PL_READ_ID).str.contains(PL_UUID_REGEX).alias("is_uuid"),
        ]
    )
    targets = flagged.filter(pl.col("is_uuid")).drop("is_uuid")

    # Fail early on an input with nothing usable in its preview
    preview = targets.fetch(10)
    if len(preview) == 0:
        raise AssertionError(f"Found 0 read_ids in {csv_path}. Nothing to do")

    return targets


@logged(log_time=True)
def build_targets_dict(
    targets: pl.LazyFrame,
) -> dict[str, list[str]]:
    """
    Collect the targets dataframe into a mapping of output filename to the
    list of distinct read ids destined for it
    """
    grouped = defaultdict(set)
    rows = targets.select([PL_READ_ID, PL_DEST_FNAME]).collect().iter_rows()
    for read_id, fname in rows:
        # A set drops read ids repeated for the same destination
        grouped[fname].add(read_id)

    return {fname: list(read_ids) for fname, read_ids in grouped.items()}


@logged(log_time=True)
def subset_pod5(
    inputs: List[Path],
    output: Path,
    columns: List[str],
    csv: Optional[Path] = None,
    table: Optional[Path] = None,
    threads: int = DEFAULT_THREADS,
    template: str = "",
    read_id_column: str = DEFAULT_READ_ID_COLUMN,
    missing_ok: bool = False,
    ignore_incomplete_template: bool = False,
    force_overwrite: bool = False,
    recursive: bool = False,
) -> int:
    """
    Build the read id to output file mapping from either a csv or a table and
    run the subsetting. Returns 0 on success and 1 after a keyboard interrupt
    """
    if not csv and not table:
        raise RuntimeError(
            "Arguments provided could not be used to generate a subset mapping."
        )

    # The direct csv mapping takes precedence over a summary table
    if csv:
        targets = parse_csv_mapping(csv)
    else:
        targets = parse_table_mapping(
            table, template, columns, read_id_column, ignore_incomplete_template
        )

    targets_dict = build_targets_dict(targets)

    if not output.exists():
        output.mkdir(parents=True)

    _inputs = collect_inputs(
        inputs, recursive=recursive, pattern="*.pod5", threads=threads
    )
    if len(_inputs) < 1:
        raise ValueError("Found no input pod5 files")

    exit_code = 0
    try:
        # `threads` is not forwarded to this call.
        # NOTE(review): the meaning of the literal False argument is not
        # visible from here - confirm against the lib_pod5 binding
        p5b.subset_pod5s_with_mapping(
            list(_inputs),
            output,
            targets_dict,
            missing_ok,
            False,
            force_overwrite,
        )
    except KeyboardInterrupt:
        print("Stopped POD5 subset following keyboard interrupt.")
        exit_code = 1
    return exit_code


@logged()
def main():
    """Entry point: build the pod5 subset argument parser and hand it to run_tool"""
    parser = prepare_pod5_subset_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_update.py
================================================
"""
Tool for updating pod5 files to the latest available version
"""

from typing import Iterable
from pathlib import Path

from tqdm.auto import tqdm

import lib_pod5 as p5b

import pod5 as p5
from pod5.tools.parsers import prepare_pod5_update_argparser, run_tool
from pod5.tools.utils import (
    PBAR_DEFAULTS,
    assert_no_duplicate_filenames,
    collect_inputs,
)


def update_pod5(
    inputs: Iterable[Path],
    output: Path,
    force_overwrite: bool = False,
    recursive: bool = False,
):
    """
    Given a list of pod5 files, update their tables to the most recent version,
    writing each result into the `output` directory under the input's filename.

    Raises AssertionError if an output path is also one of the inputs, and
    FileExistsError if outputs already exist and `force_overwrite` is not set.
    """
    if not output.exists():
        output.mkdir(parents=True, exist_ok=True)

    paths = collect_inputs(inputs, recursive=recursive, pattern="*.pod5")
    assert_no_duplicate_filenames(paths)

    exists = set(output / p.name for p in paths if Path(output / p.name).exists())

    # Existing outputs which are themselves inputs would be updated in-place.
    # Report exactly those files (the intersection), not the remainder.
    inplace = exists.intersection(paths)
    if inplace:
        inout = sorted(p.name for p in inplace)
        raise AssertionError(f"Cannot update inputs in-place. Found: {inout}")

    if not force_overwrite and exists:
        raise FileExistsError(
            f"{len(exists)} Output files already exists and --force-overwrite not set. "
            f"Found: {exists}"
        )
    else:
        for path in exists:
            path.unlink()

    # The context manager closes the progress bar even if an update fails
    with tqdm(
        total=len(paths), desc="Updating", unit="File", leave=True, **PBAR_DEFAULTS
    ) as pbar:
        for path in paths:
            dest = output / path.name
            with p5.Reader(path) as reader:
                p5b.update_file(reader.inner_file_reader, str(dest))
            pbar.update()


def main():
    """Entry point: build the pod5 update argument parser and hand it to run_tool"""
    parser = prepare_pod5_update_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/pod5_view.py
================================================
import codecs
import multiprocessing as mp
from multiprocessing.context import SpawnProcess
from multiprocessing.synchronize import Lock
import os
from pathlib import Path
from queue import Empty
import sys
from typing import Callable, Dict, Generator, List, NamedTuple, Optional, Set, Tuple

from pod5.reader import ArrowTableHandle
import polars as pl
import pyarrow as pa

import pod5 as p5
from pod5.tools.parsers import prepare_pod5_view_argparser, run_tool
from pod5.tools.polars_utils import (
    pl_format_empty_string,
    pl_format_read_id,
    pl_from_arrow,
    pl_from_arrow_batch,
)
from pod5.tools.utils import (
    DEFAULT_THREADS,
    collect_inputs,
    init_logging,
    limit_threads,
    logged,
    logged_all,
    terminate_processes,
)


logger = init_logging()

pl.enable_string_cache()


class Selection(NamedTuple):
    """The chosen output columns and the table fields needed to produce them"""

    # Column names selected for output
    selected: Set[str]
    # Read table fields required
    reads_fields: Set[str]
    # Run info table fields required
    info_fields: Set[str]

    def __contains__(self, key):
        """Membership is tested against the selected column names only"""
        is_selected = key in self.selected
        return is_selected

    def union(self) -> Set[str]:
        """Return every required field, read table and run info table combined"""
        combined = self.reads_fields.union(self.info_fields)
        return combined


class Field(NamedTuple):
    """Describes one named output field and the table fields it is built from"""

    # Help text shown when listing the fields
    docs: str
    # Read table fields needed, if any
    reads_fields: Optional[List[str]] = None
    # Run info table fields needed, if any
    info_fields: Optional[List[str]] = None


# This dict defines the order of the fields: the header and the output columns
# follow the insertion order of these keys.
# Each Field is given positionally as (docs, reads_fields, info_fields).
FIELDS: Dict[str, Field] = {
    "read_id": Field(
        "Read UUID",
        ["read_id"],
    ),
    "filename": Field(
        "Source pod5 filename",
    ),
    "read_number": Field(
        "Read number",
        ["read_number"],
    ),
    "channel": Field(
        "1-indexed channel",
        ["channel"],
    ),
    "mux": Field(
        "1-indexed well",
        ["well"],
    ),
    "end_reason": Field(
        "End reason string",
        ["end_reason"],
    ),
    "start_time": Field(
        "Seconds since the run start to the first sample of this read",
        ["start"],
        ["sample_rate"],
    ),
    "start_sample": Field(
        "Samples recorded on this channel since run start to the first sample of this read",
        ["start"],
    ),
    # NOTE(review): "sample_rate" is listed as a reads field here and in the
    # "sample_rate" entry, but as a run info field for "start_time" - confirm
    # which table provides it
    "duration": Field(
        "Seconds of sampling for this read",
        ["num_samples", "sample_rate"],
    ),
    "num_samples": Field(
        "Number of signal samples",
        ["num_samples"],
    ),
    "minknow_events": Field(
        "Number of minknow events that this read contains",
        ["num_minknow_events"],
    ),
    "sample_rate": Field(
        "Number of samples recorded each second",
        ["sample_rate"],
    ),
    "median_before": Field(
        "Current level in this well before the read",
        ["median_before"],
    ),
    # DEPRECATED
    "predicted_scaling_scale": Field(
        "Scale for predicted read scaling",
        ["predicted_scaling_scale"],
    ),
    # DEPRECATED
    "predicted_scaling_shift": Field(
        "Shift for predicted read scaling",
        ["predicted_scaling_shift"],
    ),
    # DEPRECATED
    "tracked_scaling_scale": Field(
        "Scale for tracked read scaling",
        ["tracked_scaling_scale"],
    ),
    # DEPRECATED
    "tracked_scaling_shift": Field(
        "Shift for tracked read scaling",
        ["tracked_scaling_shift"],
    ),
    "num_reads_since_mux_change": Field(
        "Number of selected reads since the last mux change on this channel",
        ["num_reads_since_mux_change"],
    ),
    "time_since_mux_change": Field(
        "Seconds since the last mux change on this channel",
        ["time_since_mux_change"],
    ),
    "run_id": Field("Run UUID", None, ["protocol_run_id"]),
    "sample_id": Field(
        "User-supplied name for the sample",
        None,
        ["sample_id"],
    ),
    "experiment_id": Field(
        "User-supplied name for the experiment",
        None,
        ["experiment_name"],
    ),
    "flow_cell_id": Field(
        "The flow cell id",
        None,
        ["flow_cell_id"],
    ),
    "pore_type": Field(
        "Name of the pore in this well",
        ["pore_type"],
    ),
    "open_pore_level": Field(
        "The tracked open pore level for this read",
        ["open_pore_level"],
    ),
}


@logged()
def print_fields():
    """Print every available field name, padded to a fixed width, with its description"""
    name_width = 28
    for name, field in FIELDS.items():
        print(name.ljust(name_width), field.docs)
    print()


@logged_all
def get_field_or_raise(key: str) -> Field:
    """Look up the Field registered under key, raising a descriptive KeyError if unknown"""
    try:
        field = FIELDS[key]
    except KeyError:
        message = (
            f"Field: '{key}' did not match any known fields. "
            "Please check it exists by viewing `-L/--list-fields`"
        )
        raise KeyError(message)
    return field


@logged_all
def select_fields(
    *,
    group_read_id: bool = False,
    include: Optional[str] = None,
    exclude: Optional[str] = None,
) -> Selection:
    """
    Resolve the fields to write from the comma separated include / exclude
    strings. With group_read_id only "read_id" is selected. Raises KeyError for
    an unknown field name and RuntimeError if nothing remains selected
    """
    selected: Set[str] = set()

    # Read ids only: nothing else needs resolving
    if group_read_id:
        selected.add("read_id")
        return Selection(selected, selected, set())

    if include:
        for raw_key in include.split(","):
            name = raw_key.strip()
            if name:
                get_field_or_raise(name)
                selected.add(name)

    # No explicit inclusion means every field
    if not selected:
        selected.update(FIELDS.keys())

    if exclude:
        for raw_key in exclude.split(","):
            name = raw_key.strip()
            if name:
                # Unknown names still raise; known but unselected names are ignored
                get_field_or_raise(name)
                selected.discard(name)

    if not selected:
        raise RuntimeError("Zero Fields selected. Please select at least one field")

    reads_fields: Set[str] = set()
    info_fields: Set[str] = set()

    for field in (FIELDS[name] for name in selected):
        reads_fields.update(field.reads_fields or ())
        info_fields.update(field.info_fields or ())

    # Anything taken from run_info also needs the fields used to perform the join
    if info_fields:
        reads_fields.add("run_info")
        info_fields.add("acquisition_id")

    return Selection(selected, reads_fields, info_fields)


def get_format_view_table_fn(
    path: Path, selection: Selection
) -> Callable[[pl.LazyFrame], pl.LazyFrame]:
    """
    Build the function which formats a view table for the selected fields.

    The derived-column expressions and the output column order depend only on
    `path` and `selection`, so they are computed once here; the returned
    function applies them to each LazyFrame it is given and selects the
    chosen columns in FIELDS order.
    """
    # Expressions producing the output columns which are renamed or derived
    # from the underlying table columns
    exprs: List[pl.Expr] = []
    if "filename" in selection:
        exprs.append(pl.lit(path.name).alias("filename"))
    if "read_id" in selection:
        exprs.append(pl_format_read_id(pl.col("read_id")))
    if "mux" in selection:
        exprs.append(pl.col("well").alias("mux"))
    if "start_time" in selection:
        exprs.append((pl.col("start") / pl.col("sample_rate")).alias("start_time"))
    if "start_sample" in selection:
        exprs.append(pl.col("start").alias("start_sample"))
    if "duration" in selection:
        exprs.append((pl.col("num_samples") / pl.col("sample_rate")).alias("duration"))
    if "minknow_events" in selection:
        exprs.append(pl.col("num_minknow_events").alias("minknow_events"))
    if "run_id" in selection:
        exprs.append(pl.col("protocol_run_id").alias("run_id"))
    if "experiment_id" in selection:
        exprs.append(pl.col("experiment_name").alias("experiment_id"))

    # NOTE(review): "protocol_run_id" is the source column; the selected output
    # column is "run_id", which the replacement below does not touch - confirm
    # whether "run_id" was intended here
    maybe_empty = ["experiment_id", "protocol_run_id", "sample_id", "flow_cell_id"]
    order = [key for key in FIELDS.keys() if key in selection.selected]

    # All tables are the same so we can compute this work ONCE
    def format_view_table(lf: pl.LazyFrame) -> pl.LazyFrame:
        lf = lf.with_columns(exprs)

        # Replace potentially empty fields with "not_set"
        # This can't be done in the above expression due to the behaviour of
        # name.keep()
        empty_cols = [f for f in maybe_empty if f in lf.collect_schema().names()]
        if empty_cols:
            lf = lf.with_columns(
                pl_format_empty_string(pl.col(empty_cols), "not_set").name.keep()
            )

        # Apply the field selection order; any helper column which was not
        # selected is left out by this select
        return lf.select(order)

    return format_view_table


@logged(log_time=True)
def write(
    ldf: pl.LazyFrame,
    output: Optional[Path],
    separator: str = "\t",
) -> None:
    """
    Collect `ldf` and emit it as header-less delimited text.

    Parameters
    ----------
    ldf : pl.LazyFrame
        The lazy table to collect and write
    output : Optional[Path]
        File to append the rows to. When `None` the rows are printed to stdout
    separator : str
        The column separator

    Raises
    ------
    BrokenPipeError
        Re-raised after stdout has been redirected to the null device
    """
    csv_options = {
        "include_header": False,
        "separator": separator,
        "null_value": "",
        "float_precision": 8,
    }

    if output is None:
        # No output path: render the table as a string and print it to stdout
        rendered = ldf.collect().write_csv(**csv_options)
        try:
            # Suppress print's own newline so stdout matches the file output
            print(rendered, end="")
        except BrokenPipeError as exc:
            # https://docs.python.org/3/library/signal.html#note-on-sigpipe
            null_fd = os.open(os.devnull, os.O_WRONLY)
            os.dup2(null_fd, sys.stdout.fileno())
            raise exc
        return

    # Append (binary mode) to the nominated output path
    with output.open("ab") as handle:
        ldf.collect().write_csv(handle, **csv_options)


def write_header(
    output: Optional[Path], selection: Selection, separator: str = "\t"
) -> None:
    """
    Write the header line: the selected field names, in `FIELDS` order, joined
    by `separator`. Printed to stdout when `output` is None, otherwise written
    as the text content of `output` followed by a newline.
    """
    column_names = [name for name in FIELDS if name in selection.selected]
    header = separator.join(column_names)

    if output is not None:
        output.write_text(header + "\n")
        return

    print(header, file=sys.stdout, flush=True)


@logged_all
def resolve_output(output: Optional[Path], force_overwrite: bool) -> Optional[Path]:
    """
    Resolve the path that output should be written to.

    Returns `None` when `output` is `None`. An existing file is deleted when
    `force_overwrite` is set, otherwise FileExistsError is raised. A directory
    resolves to the file "view.txt" inside it, which is checked the same way.
    """
    if output is None:
        return None

    # Do not allow accidental overwrite
    already_exists = output.is_file()
    if already_exists and not force_overwrite:
        raise FileExistsError(
            f"{output} points to an existing file and --force-overwrite not set"
        )
    if already_exists:
        output.unlink()

    if not output.is_dir():
        return output

    # Given a directory: validate the default filename within it
    return resolve_output(output / "view.txt", force_overwrite)


@logged()
def assert_unique_acquisition_id(run_info: pl.LazyFrame, path: Path) -> None:
    """
    Check the run_info table grouped by "acquisition_id": every group must
    contain exactly one unique row. Raises AssertionError naming the offending
    ids and the file name of `path` otherwise.
    """
    common_acq_ids = []
    for acq_id, frame in run_info.collect().group_by(pl.col("acquisition_id")):
        if frame.n_unique() != 1:
            common_acq_ids.append(acq_id)

    if not common_acq_ids:
        return

    raise AssertionError(
        f"Found non-unique run_info acquisition_id in {path.name}: {common_acq_ids}. "
    )


def parse_reads_table_all(
    reader: p5.Reader, included_fields: List[int]
) -> pl.LazyFrame:
    """
    Read the whole reads table of `reader`, restricted to the column indices in
    `included_fields`, and return it as a polars LazyFrame
    """
    logger.debug(f"Parsing {reader.path.name} records {included_fields=}")

    read_options = pa.ipc.IpcReadOptions(included_fields=included_fields)
    table_location = reader.inner_file_reader.get_file_read_table_location()

    with ArrowTableHandle(table_location, options=read_options) as handle:
        arrow_table = handle.reader.read_all()
        # Convert while the handle is still open, then hand back a lazy view
        return pl_from_arrow(arrow_table, rechunk=False).lazy()


def parse_reads_table_batch(
    reader: p5.Reader, included_fields: List[int], batch_index: int
) -> Tuple[pl.LazyFrame, int]:
    """
    Read a single record batch (`batch_index`) of the reads table, restricted to
    the column indices in `included_fields`.

    Returns the batch as a polars LazyFrame together with its row count.
    """
    logger.debug(
        f"Parsing {reader.path.name} record batch {batch_index} {included_fields=}"
    )

    read_options = pa.ipc.IpcReadOptions(included_fields=included_fields)
    table_location = reader.inner_file_reader.get_file_read_table_location()

    with ArrowTableHandle(table_location, options=read_options) as handle:
        arrow_batch = handle.reader.get_record_batch(batch_index)
        row_count = arrow_batch.num_rows
        lazy_batch = pl_from_arrow_batch(arrow_batch, rechunk=False).lazy()

    return lazy_batch, row_count


@logged_all
def parse_read_table_chunks(
    reader: p5.Reader, included_fields: List[int], approx_size: int = 99_999
) -> Generator[pl.LazyFrame, None, None]:
    """
    Yield polars LazyFrames built from consecutive record batches of the reads
    table. Batches are accumulated until their combined row count exceeds
    `approx_size`, so every chunk is made of whole batches. Any remaining rows
    are yielded as a final chunk.
    """
    pending: List[pl.LazyFrame] = []
    chunk_rows = 0

    for batch_index in range(reader.read_table.num_record_batches):
        batch, batch_rows = parse_reads_table_batch(
            reader, included_fields, batch_index
        )
        pending.append(batch)
        chunk_rows += batch_rows

        # Keep accumulating until the size threshold has been passed
        if chunk_rows <= approx_size:
            continue

        reads_chunk = pl.concat(pending)
        logger.debug(f"Emitting chunk of {chunk_rows} rows")
        pending = []
        chunk_rows = 0
        yield reads_chunk

    if chunk_rows > 0:
        reads_chunk = pl.concat(pending)
        pending = []
        logger.debug(f"Emitting final chunk of {chunk_rows} rows")
        yield reads_chunk


@logged()
def parse_run_info_table(
    reader: p5.Reader, selection: Selection
) -> Optional[pl.LazyFrame]:
    """
    Parse the run info table from a pod5 file returning a polars LazyFrame
    containing only the columns named in `selection.info_fields`.

    Returns `None` when none of the run info columns are selected. Raises
    AssertionError (via `assert_unique_acquisition_id`) if the parsed table
    fails the acquisition id uniqueness check.
    """
    schema_names = reader.run_info_table.schema.names
    included_fields: List[int] = [
        index for index, name in enumerate(schema_names) if name in selection.info_fields
    ]

    # Nothing from the run info table was requested
    if not included_fields:
        return None

    read_options = pa.ipc.IpcReadOptions(included_fields=included_fields)
    table_location = reader.inner_file_reader.get_file_run_info_table_location()

    with ArrowTableHandle(table_location, options=read_options) as handle:
        arrow_table = handle.reader.read_all()
        run_info = pl_from_arrow(arrow_table, rechunk=False).lazy()

    assert_unique_acquisition_id(run_info, reader.path)
    return run_info


@logged()
def join_reads_to_run_info(reads: pl.LazyFrame, run_info: pl.LazyFrame) -> pl.LazyFrame:
    """
    Join the reads table to the de-duplicated run_info table, matching the
    reads "run_info" column (cast to a string) to "acquisition_id"
    """
    reads_with_str_key = reads.with_columns(pl.col("run_info").cast(pl.Utf8))
    unique_run_info = run_info.unique()
    return reads_with_str_key.join(
        unique_run_info,
        left_on="run_info",
        right_on="acquisition_id",
    )


def get_included_reads_table_fields(reader: p5.Reader, selection: Selection):
    """
    Return the column indices of the reads table schema whose names appear in
    `selection.reads_fields`. Raises KeyError if no column is selected.
    """
    schema_names = reader.read_table.schema.names
    included_fields: List[int] = [
        index
        for index, name in enumerate(schema_names)
        if name in selection.reads_fields
    ]

    if included_fields:
        return included_fields

    raise KeyError(
        f"No reads fields set in {selection.selected=} {selection.reads_fields=}"
    )


def get_reads_tables(
    path: Path, selection: Selection, threshold: int = 100_000
) -> Generator[pl.LazyFrame, None, None]:
    """
    Generate formatted lazy dataframes from the records of the pod5 file at
    `path`.

    Files with at most `threshold` reads are parsed and yielded as one table.
    Larger files are yielded in chunks of whole record batches to limit memory
    consumption. Each table is joined to the run info table when any run info
    fields were selected.
    """
    with p5.Reader(path) as reader:
        included_fields = get_included_reads_table_fields(reader, selection)
        format_view_table_fn = get_format_view_table_fn(path, selection)
        run_info = parse_run_info_table(reader, selection)

        if reader.num_reads > threshold:
            # Lazily produced chunks of roughly `threshold` records
            tables = parse_read_table_chunks(
                reader, included_fields, approx_size=threshold - 1
            )
        else:
            # Small file: a single table holding every record
            tables = (parse_reads_table_all(reader, included_fields),)

        for table in tables:
            if run_info is not None:
                table = join_reads_to_run_info(table, run_info)
            yield format_view_table_fn(table)


def join_workers(processes: List[SpawnProcess], exceptions: mp.JoinableQueue) -> None:
    """
    Poll the worker processes until all of them have exited, surfacing any
    failure they report.

    Parameters
    ----------
    processes : List[SpawnProcess]
        The worker processes to wait for
    exceptions : mp.JoinableQueue
        Queue on which workers put `(exception, path)` tuples

    Raises
    ------
    SystemExit
        With status 1 if a worker reported a BrokenPipeError
    RuntimeError
        If a worker reported any other exception (chained from that exception)
    mp.ProcessError
        If a worker exited with a non-zero exit code
    """

    def _fail(exc, path):
        """Acknowledge a reported worker exception and abort the caller"""
        exceptions.task_done()
        if isinstance(exc, BrokenPipeError):
            sys.exit(1)
        raise RuntimeError(f"Error while processing '{path}'") from exc

    running = set(processes)
    while running:
        try:
            exc, path = exceptions.get(timeout=0.1)
        except Empty:
            pass
        else:
            # Stop the remaining workers before reporting the failure
            terminate_processes(processes)
            _fail(exc, path)

        finished = set()
        for prc in running:
            exit_code = prc.exitcode

            # Still running
            if exit_code is None:
                continue

            # A negative exit code means the worker was killed by a signal, which
            # is as much a failure as a positive exit code: its work is incomplete
            if exit_code != 0:
                terminate_processes(processes)
                raise mp.ProcessError(
                    f"Unexpected exception ocurrecd in {prc} - exit code: {exit_code}"
                )
            finished.add(prc)
        running -= finished

    for prc in processes:
        prc.join()

    # A worker may put its exception on the queue and exit cleanly between two
    # polls above, so check once more now that every worker has exited. The
    # workers are already gone, so there is nothing left to terminate here.
    try:
        exc, path = exceptions.get(timeout=0.1)
    except Empty:
        return
    _fail(exc, path)


@logged_all
def worker_process(
    paths: mp.JoinableQueue,
    exceptions: mp.JoinableQueue,
    lock: Lock,
    output: Optional[Path],
    separator: str,
    selection: Selection,
) -> None:
    """
    Consume pod5 paths from the `paths` queue, parse their records and write each
    resulting table to `output` while holding `lock`.

    The loop ends when the `None` sentinel is received from `paths`. Any
    exception raised while working is not propagated: it is put on the
    `exceptions` queue as an `(exception, path)` tuple, where `path` is the most
    recently received queue item (`None` if nothing had been received yet).

    Parameters
    ----------
    paths : mp.JoinableQueue
        Queue of pod5 paths to process, terminated by a `None` sentinel
    exceptions : mp.JoinableQueue
        Queue used to report a failure back to the parent process
    lock : Lock
        Lock held around every call to `write`
    output : Optional[Path]
        Passed through to `write` as the output destination
    separator : str
        Passed through to `write` as the column separator
    selection : Selection
        The field selection passed to `get_reads_tables`
    """
    path: Optional[Path] = None
    try:
        while True:
            path = paths.get()
            if path is None:
                # Sentinel received: acknowledge it and stop consuming
                paths.task_done()
                break

            try:
                for table in get_reads_tables(path, selection):
                    # Only one worker writes at a time
                    with lock:
                        write(ldf=table, output=output, separator=separator)
            finally:
                # Always acknowledge the path, even if processing it failed
                paths.task_done()
        paths.close()

    except Exception as exc:
        # Report the failure to the parent instead of raising in the child
        exceptions.put((exc, path))


def launch_view_workers(
    paths: Set[Path],
    output: Path,
    selection: Selection,
    separator: str,
    num_workers: int,
):
    """
    Start `num_workers` spawned daemon processes running `worker_process` over
    `paths`, wait for them with `join_workers`, then join and close the paths
    queue.
    """
    ctx = mp.get_context("spawn")
    write_lock = ctx.Lock()
    paths_queue = ctx.JoinableQueue(maxsize=len(paths) * 2)
    exceptions_queue = ctx.JoinableQueue(maxsize=len(paths))

    # Load every path before any worker starts
    for pod5_path in paths:
        paths_queue.put(pod5_path)

    # Every worker receives the same arguments
    worker_kwargs = {
        "paths": paths_queue,
        "exceptions": exceptions_queue,
        "lock": write_lock,
        "output": output,
        "separator": separator,
        "selection": selection,
    }

    processes: List[SpawnProcess] = []
    for _ in range(num_workers):
        process = ctx.Process(target=worker_process, kwargs=worker_kwargs, daemon=True)
        process.start()
        processes.append(process)

        # Enqueue a stop sentinel for each worker
        paths_queue.put(None)

    join_workers(processes, exceptions_queue)

    paths_queue.join()
    paths_queue.close()
    paths_queue.join_thread()


@logged_all
def view_pod5(
    inputs: List[Path],
    output: Path,
    separator: str = "\t",
    recursive: bool = False,
    force_overwrite: bool = False,
    list_fields: bool = False,
    no_header: bool = False,
    threads: int = DEFAULT_THREADS,
    **kwargs,
) -> None:
    """
    Given a list of POD5 files write a table to view their contents.

    When `list_fields` is set the available fields are printed and nothing else
    is done. Otherwise the inputs are searched for "*.pod5" files, the header is
    written (unless `no_header`) and worker processes write the table rows.
    Remaining keyword arguments are forwarded to `select_fields`.

    Raises AssertionError if no pod5 files are found.
    """
    if list_fields:
        print_fields()
        return

    max_threads = limit_threads(threads)
    destination = resolve_output(output, force_overwrite)

    # Decode escaped separator characters e.g. \t
    decoded_separator = codecs.decode(separator, "unicode-escape")

    # Parse column selection args
    selection = select_fields(**kwargs)

    pod5_paths = collect_inputs(
        inputs, recursive=recursive, pattern="*.pod5", threads=max_threads
    )
    if len(pod5_paths) == 0:
        raise AssertionError("Found no pod5 files searching inputs")

    # Never start more workers than there are files to process
    worker_count = min(len(pod5_paths), max_threads)

    if not no_header:
        write_header(
            output=destination, selection=selection, separator=decoded_separator
        )

    launch_view_workers(
        paths=pod5_paths,
        output=destination,
        selection=selection,
        separator=decoded_separator,
        num_workers=worker_count,
    )


def main():
    """Command line entry point: build the argument parser and run the tool"""
    parser = prepare_pod5_view_argparser()
    run_tool(parser)


if __name__ == "__main__":
    main()


================================================
FILE: python/pod5/src/pod5/tools/polars_utils.py
================================================
from typing import Optional
import polars as pl
import pyarrow as pa

# Reserved column names used in polars dataframes
PL_DEST_FNAME = "__dest_fname"
PL_SRC_FNAME = "__src_fname"
PL_READ_ID = "__read_id"
# Regular expression matching a whole string made of lowercase hexadecimal
# groups of 8-4-4-4-12 characters separated by hyphens (UUID text form)
PL_UUID_REGEX = "^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$"


def pl_format_read_id(read_id_col: pl.Expr) -> pl.Expr:
    """
    Format binary read ids in UUID style: the hex encoding of the column split
    into hyphen-separated groups of 8-4-4-4-12 characters
    """
    hex_id = read_id_col.bin.encode("hex")

    # (offset, length) of each UUID group within the hex string
    group_bounds = ((0, 8), (8, 4), (12, 4), (16, 4), (20, 12))
    groups = [hex_id.str.slice(offset, length) for offset, length in group_bounds]

    return pl.format("{}-{}-{}-{}-{}", *groups)


def pl_format_empty_string(expr: pl.Expr, subst: Optional[str]) -> pl.Expr:
    """
    Replace zero-length strings in `expr` with the literal `subst`, leaving all
    other values untouched
    """
    is_empty = expr.str.len_bytes() == 0
    replacement = pl.lit(subst)
    return pl.when(is_empty).then(replacement).otherwise(expr)


def pl_from_arrow(table: pa.Table, rechunk: bool) -> pl.DataFrame:
    """
    Convert a pyarrow table to polars, working around the failure to read the
    pod5 arrow extension types by removing their extension name from the field
    metadata first
    """
    # Based on https://github.com/pola-rs/polars/issues/20700
    extension_key = b"ARROW:extension:name"
    pod5_extension_names = (b"minknow.uuid", b"minknow.vbz")

    def strip_pod5_extension(field: pa.Field) -> pa.Field:
        metadata = field.metadata
        if metadata is None:
            return field
        if metadata.get(extension_key) not in pod5_extension_names:
            return field

        # Rebuild the field with every metadata entry except the extension name
        del metadata[extension_key]
        return field.remove_metadata().with_metadata(metadata)

    plain_schema = pa.schema([strip_pod5_extension(field) for field in table.schema])
    plain_table = pa.Table.from_batches(table.to_batches(), schema=plain_schema)
    return pl.from_arrow(plain_table, rechunk=rechunk)


def pl_from_arrow_batch(record_batch: pa.RecordBatch, rechunk: bool) -> pl.DataFrame:
    """
    Convert a single pyarrow record batch to polars by wrapping it in a table
    and applying the same extension type workaround as `pl_from_arrow`
    """
    single_batch_table = pa.Table.from_batches([record_batch])
    return pl_from_arrow(single_batch_table, rechunk=rechunk)


================================================
FILE: python/pod5/src/pod5/tools/utils.py
================================================
"""
Utility functions for pod5 tools
"""

import datetime
import functools
import glob
import logging
import multiprocessing as mp
from multiprocessing.context import SpawnProcess
import os
from time import perf_counter
from typing import Collection, Iterable, List, Set, Union
from pathlib import Path
import uuid


# Default number of threads: the logical CPU count capped at 4.
# os.cpu_count() can return None if it fails, in which case 4 is used
DEFAULT_THREADS = min(os.cpu_count() or 4, 4)


def init_logging():
    """
    Initialise and return the "pod5" logger.

    When POD5_DEBUG is not enabled only a NullHandler is attached. Otherwise the
    logger is set to DEBUG and a file handler is attached which writes to a
    timestamped log file in the current working directory, named after the main
    process or the child process id.
    """
    logger = logging.getLogger("pod5")

    if not is_pod5_debug():
        logger.addHandler(logging.NullHandler())
        return logger

    datetime_now = datetime.datetime.now().strftime("%Y-%m-%d--%H-%M-%S")
    in_main_process = mp.current_process().name == "MainProcess"
    pid = "main" if in_main_process else f"p-{os.getpid()}"

    logger.setLevel(logging.DEBUG)

    log_formatter = logging.Formatter("%(asctime)s %(levelname)s %(message)s")
    file_handler = logging.FileHandler(filename=f"{datetime_now}-{pid}-pod5.log")
    file_handler.setFormatter(log_formatter)
    file_handler.setLevel(logging.DEBUG)

    logger.addHandler(file_handler)
    return logger


def logged(log_return: bool = False, log_args: bool = False, log_time: bool = False):
    """
    Parameterised decorator which writes debug records to the "pod5" logger
    around each call of the decorated function.

    Every call logs an entry record tagged with a short random id and the
    function name. Exceptions are logged and re-raised.

    Parameters
    ----------
    log_return : bool
        Also log the returned value
    log_args : bool
        Include the positional and keyword arguments in the entry record
    log_time : bool
        Also log the call duration in seconds
    """

    def decorator(func):
        @functools.wraps(func)
        def wrapper(*args, **kwargs):
            pod5_logger = logging.getLogger("pod5")

            # Two characters of a random uuid tell interleaved calls apart
            uid = f"{str(uuid.uuid4())[:2]}:'{func.__name__}'"

            if log_args:
                entry_message = "{0}:{1}, {2}".format(uid, args, kwargs)
            else:
                entry_message = "{0}".format(uid)
            pod5_logger.debug(entry_message)

            started = perf_counter()
            try:
                ret = func(*args, **kwargs)
            except Exception as exc:
                pod5_logger.debug("{0}:Exception:{1}".format(uid, exc))
                raise exc

            if log_time:
                duration_s = perf_counter() - started
                pod5_logger.debug("{0}:Done:{1:.3f}s".format(uid, duration_s))
            if log_return:
                pod5_logger.debug("{0}:Returned:{1}".format(uid, ret))
            return ret

        return wrapper

    return decorator


# Decorator with every logging option enabled
logged_all = logged(log_return=True, log_args=True, log_time=True)


@logged_all
def terminate_processes(processes: List[SpawnProcess]) -> None:
    """
    Terminate every process in `processes`, skipping any that raise ValueError
    because they have already been closed
    """
    for process in processes:
        try:
            process.terminate()
        except ValueError:
            # Raised if the process is already closed - nothing left to stop
            continue


@logged(log_return=True)
def limit_threads(requested: int) -> int:
    """
    Sanitise and limit the number of ``requested`` threads to the number of logical
    cores.

    A request below 1 returns the core count (4 if it is unknown). Otherwise the
    smaller of the request and the core count is returned, or the request itself
    if the core count is unknown.
    """
    available = os.cpu_count()
    if requested < 1:
        return available or 4
    return min(available or requested, requested)


@logged(log_time=True)
def collect_inputs(
    paths: Iterable[Path],
    recursive: bool,
    pattern: Union[str, Collection[str]],
    threads: int = DEFAULT_THREADS,
) -> Set[Path]:
    """
    Returns the set of paths which match any of the given glob-style `pattern`s

    Directories among `paths` are globbed (optionally recursively). Files among
    `paths` must themselves match one of the `pattern`s to be included.

    Raises FileExistsError if any inputs do not exist and AssertionError if no
    input paths were given
    """
    unique_paths = set(paths)
    assert_inputs_exist(unique_paths)
    if not unique_paths:
        raise AssertionError("Got 0 input paths to search")

    # No point using more search processes than there are paths
    search_threads = min(threads, len(unique_paths))
    return search_paths(unique_paths, recursive, pattern, search_threads)


@logged(log_time=True, log_return=True)
def assert_inputs_exist(inputs: Iterable[Path]):
    """
    Assert all inputs exist. Raises FileExistsError listing the missing paths
    otherwise
    """
    bad_paths = {path for path in set(inputs) if not path.exists()}
    if not bad_paths:
        return

    raise FileExistsError(f"{len(bad_paths)} inputs do not exist: {bad_paths}")


@logged(log_time=True)
def search_paths(
    paths: Iterable[Path],
    recursive: bool,
    pattern: Union[str, Collection[str]],
    threads: int = DEFAULT_THREADS,
) -> Set[Path]:
    """
    Search every path in `paths` with `search_path` using a pool of `threads`
    processes and return the union of all matches. A single string `pattern` is
    treated as a collection of one pattern.
    """
    patterns = [pattern] if isinstance(pattern, str) else pattern
    search_one = functools.partial(search_path, recursive=recursive, patterns=patterns)

    with mp.Pool(processes=threads) as pool:
        # Results arrive in any order; the union is order independent
        return set().union(*pool.imap_unordered(search_one, paths))


@logged(log_time=True)
def search_path(path: Path, recursive: bool, patterns: Collection[str]) -> Set[Path]:
    """
    Return the files found at `path` which match any of `patterns`.

    A directory is globbed (recursively if requested) and its matching files are
    returned. A file is returned on its own if it matches. Anything else gives
    an empty set.
    """

    def _any_match(candidate: Path):
        for file_pattern in patterns:
            if candidate.match(file_pattern):
                return True
        return False

    if path.is_dir():
        # "**" only descends into sub-directories when recursive is set
        glob_pattern = str(path / "**" / "*") if recursive else str(path / "*")
        candidates = (
            Path(pathname) for pathname in glob.glob(glob_pattern, recursive=recursive)
        )
        return {
            candidate
            for candidate in candidates
            if candidate.is_file() and _any_match(candidate)
        }

    # Non-directory: it must be a file and match one of the patterns
    if path.is_file() and _any_match(path):
        return {path}

    return set()


@logged(log_time=True)
def assert_no_duplicate_filenames(inputs: Collection[Path]) -> None:
    """
    Raises ValueError if any two paths in `inputs` share the same file name
    (the final path component)
    """
    filenames = [path.name for path in inputs]
    if len(set(filenames)) == len(filenames):
        return

    raise ValueError(
        "One or more inputs share the same filename. "
        "This would cause a files to be overwritten at runtime"
    )


# Do not log this function as it's executed at import time
def is_disable_pbar() -> bool:
    """
    Return True if the progress bar should be disabled.

    The POD5_PBAR environment variable (default "1") is read as an integer: zero
    disables the progress bar. A value which cannot be parsed leaves it enabled.
    """
    raw_value = os.environ.get("POD5_PBAR", "1")
    try:
        return int(raw_value) == 0
    except Exception:
        return False


# Keyword arguments shared by progress bars; `disable` is evaluated at import time
PBAR_DEFAULTS = {
    "disable": is_disable_pbar(),
    "smoothing": 0.0,
    "dynamic_ncols": True,
    "ascii": True,
}


# Do not log this function as it's executed during logging initialisation
def is_pod5_debug() -> bool:
    """
    Return True if debug logging is enabled.

    The POD5_DEBUG environment variable (default "0") is read as an integer: any
    non-zero value enables debugging. A value which cannot be parsed also
    enables it.
    """
    raw_value = os.environ.get("POD5_DEBUG", "0")
    try:
        return int(raw_value) != 0
    except Exception:
        return True


================================================
FILE: python/pod5/src/pod5/writer.py
================================================
"""
Tools for writing POD5 data
"""

import datetime
import itertools
from pathlib import Path
from typing import (
    Any,
    Callable,
    Dict,
    List,
    Optional,
    Sequence,
    Tuple,
    Type,
    TypeVar,
    Union,
)
import sys

import lib_pod5 as p5b
import numpy as np
from pod5.reader import ReadRecord
import pytz

if sys.version_info >= (3, 10):
    from typing import TypeAlias
else:
    from typing_extensions import TypeAlias

from pod5.api_utils import Pod5ApiException, safe_close
from pod5.pod5_types import (
    BaseRead,
    CompressedRead,
    EndReason,
    PathOrStr,
    Read,
    RunInfo,
)

# Software name used by Writer when the caller does not provide one
DEFAULT_SOFTWARE_NAME = "Python API"

SignalType: TypeAlias = p5b.SignalType
"""The type of compression applied to a signal `SignalType::{UncompressedSignal, VbzSignal}`"""
PoreType = str
"""The name of a Pore"""
# Type variable bound to the kinds of object that Writer indexes and caches
T = TypeVar("T", bound=Union[EndReason, PoreType, RunInfo])


def force_type_and_default(value, dtype, count, default_value=None):
    """
    Return `value` as a numpy array of `dtype`, substituting a default-filled
    array when `value` is missing.

    Parameters
    ----------
    value : Optional[numpy.ndarray]
        The array to convert, or None to use the default
    dtype : numpy dtype
        The dtype of the returned array
    count : int
        Length of the default array built when `value` is None
    default_value : Any, optional
        Value used to fill the default array

    Returns
    -------
    numpy.ndarray
        `value` itself if it already has `dtype`, otherwise a converted copy

    Raises
    ------
    AssertionError
        If both `value` and `default_value` are None
    """
    if default_value is not None and value is None:
        value = np.array([default_value] * count, dtype=dtype)
    assert value is not None
    # Convert to the requested dtype: the builtin `type` is not a valid dtype
    return value.astype(dtype, copy=False)


def map_to_tuples(info_map: Any) -> List[Tuple[str, str]]:
    """
    Convert a property map (e.g. context_tags and tracking_id) to a list of
    string pairs to pass to the pod5 C API.

    A dict gives one `(str(key), str(value))` pair per item. A list gives one
    pair per element, built from the element's first two entries. Any other
    type raises TypeError.
    """
    if isinstance(info_map, dict):
        return [(str(key), str(value)) for key, value in info_map.items()]

    if isinstance(info_map, list):
        return [(str(entry[0]), str(entry[1])) for entry in info_map]

    raise TypeError(f"Unknown input type for context tags {type(info_map)}")


def timestamp_to_int(time_stamp: Union[datetime.datetime, int]) -> int:
    """
    Return `time_stamp` unchanged if it is already an integer, otherwise convert
    the datetime to UTC and return its timestamp in whole milliseconds
    """
    if not isinstance(time_stamp, int):
        utc_time = time_stamp.astimezone(pytz.utc)
        return int(utc_time.timestamp() * 1000)
    return time_stamp


class Writer:
    """
    Pod5 File Writer

    Wraps a `lib_pod5` file writer handle. EndReason, PoreType and RunInfo
    objects are added to the file at most once: their indices are cached so that
    repeated additions return the existing index. Can be used as a context
    manager, which closes the handle on exit.
    """

    def __init__(
        self,
        path: PathOrStr,
        software_name: str = DEFAULT_SOFTWARE_NAME,
        signal_compression_type: SignalType = SignalType.VbzSignal,
    ):
        """
        Open a pod5 file for Writing.

        Parameters
        ----------
        path : os.PathLike, str
            The path to the pod5 file to create
        software_name : str
            The name of the application used to create this pod5 file
        signal_compression_type : SignalType
            The type of compression to use in the file. Defaults to Vbz.

        Raises
        ------
        FileExistsError
            If `path` is an existing file
        Pod5ApiException
            If the underlying file writer could not be created
        """
        self._path = Path(path).absolute()
        self._software_name = software_name
        self._signal_compression_type = signal_compression_type

        if self._path.is_file():
            raise FileExistsError(
                f"Input path already exists. Refusing to overwrite: {self._path}"
            )

        options = p5b.FileWriterOptions()
        options.signal_compression_type = signal_compression_type

        self._writer: Optional[p5b.FileWriter] = p5b.create_file(
            str(self._path), software_name, options
        )
        if not self._writer:
            raise Pod5ApiException(
                f"Failed to open writer at {self._path} : {p5b.get_error_string()}"
            )

        # Caches mapping each added object to its index in the file
        self._end_reasons: Dict[EndReason, int] = {}
        self._pores: Dict[PoreType, int] = {}
        self._run_infos: Dict[RunInfo, int] = {}

        # Internal lookup of object cache based on their respective type
        self._index_caches: Dict[Type, Dict[Any, int]] = {
            EndReason: self._end_reasons,
            PoreType: self._pores,
            RunInfo: self._run_infos,
        }

        # Internal lookup of _add functions based on their respective type
        self._adder_funcs: Dict[Type, Callable[[Any], int]] = {
            EndReason: self._add_end_reason,
            PoreType: self._add_pore_type,
            RunInfo: self._add_run_info,
        }

    def __enter__(self) -> "Writer":
        return self

    def __exit__(self, *exc_details) -> None:
        self.close()

    def close(self) -> None:
        """Close the FileWriter handle"""
        safe_close(self, "_writer")
        # Methods which need the handle raise Pod5ApiException once it is None
        self._writer = None

    @property
    def path(self) -> Path:
        """Return the path to the pod5 file"""
        return self._path

    @property
    def software_name(self) -> str:
        """Return the software name used to open this file"""
        return self._software_name

    @property
    def signal_compression_type(self) -> SignalType:
        """Return the signal compression type used by this file"""
        return self._signal_compression_type

    def add(self, obj: Union[EndReason, PoreType, RunInfo]) -> int:
        """
        Add a `EndReason`, `PoreType`, or
        `RunInfo` object to the Pod5 file (if it doesn't already
        exist) and return the index of this object in the Pod5 file.

        Parameters
        ----------
        obj : Union[EndReason, PoreType, RunInfo]
            Object to find in this Pod5 file, adding it if it doesn't exist already

        Returns
        -------
        index : int
            The index of the object in the Pod5 file

        Raises
        ------
        KeyError
            If the exact type of `obj` is not one of the supported types
        """
        # Get the index cache for the type of object given
        index_cache = self._index_caches[type(obj)]

        # Return the index of this object if it exists
        if obj in index_cache:
            return index_cache[obj]

        # Add object using the associated adder function e.g. _add_pore(pore: Pore)
        # and store the new index in the cache for future look-ups avoiding duplication
        added_index = self._adder_funcs[type(obj)](obj)
        index_cache[obj] = added_index

        # Return the newly added index
        return added_index

    def _add_end_reason(self, end_reason: EndReason) -> int:
        """Add the given EndReason instance to the pod5 file returning its index"""
        if self._writer is None:
            raise Pod5ApiException("Writer handle has been closed")
        return self._writer.add_end_reason(end_reason.reason.value)

    def _add_pore_type(self, pore_type: PoreType) -> int:
        """Add the given PoreType instance to the pod5 file returning its index"""
        if self._writer is None:
            raise Pod5ApiException("Writer handle has been closed")
        return self._writer.add_pore(pore_type)

    def _add_run_info(self, run_info: RunInfo) -> int:
        """Add the given RunInfo instance to the pod5 file returning its index"""
        if self._writer is None:
            raise Pod5ApiException("Writer handle has been closed")

        # Arguments are positional: timestamps are passed as integers and the
        # context_tags / tracking_id maps as lists of string pairs
        return self._writer.add_run_info(
            run_info.acquisition_id,
            timestamp_to_int(run_info.acquisition_start_time),
            run_info.adc_max,
            run_info.adc_min,
            map_to_tuples(run_info.context_tags),
            run_info.experiment_name,
            run_info.flow_cell_id,
            run_info.flow_cell_product_code,
            run_info.protocol_name,
            run_info.protocol_run_id,
            timestamp_to_int(run_info.protocol_start_time),
            run_info.sample_id,
            run_info.sample_rate,
            run_info.sequencing_kit,
            run_info.sequencer_position,
            run_info.sequencer_position_type,
            run_info.software,
            run_info.system_name,
            run_info.system_type,
            map_to_tuples(run_info.tracking_id),
        )

    def contains(self, obj: Union[EndReason, PoreType, RunInfo]) -> bool:
        """
        Test if this Pod5 file contains the given object.

        Parameters
        ----------
        obj: Union[EndReason, PoreType, RunInfo]
            Object to find in this Pod5 file

        Returns
        -------
        bool
            True if obj has already been added to this file
        """
        return obj in self._index_caches[type(obj)]

    def find(self, obj: Union[EndReason, PoreType, RunInfo]) -> int:
        """
        Returns the index of obj in this Pod5 file raising a KeyError if it is missing.

        Parameters
        ----------
        obj: Union[EndReason, PoreType, RunInfo]
            Obj instance to find in this Pod5 file

        Returns
        -------
        int
            The index of the object in this Pod5 file

        Raises
        ------
        KeyError
            If the object is not in this file
        """
        try:
            return self._index_caches[type(obj)][obj]
        except KeyError as exc:
            raise KeyError(
                f"Could not find index of {obj} in Pod5 file writer: {self}"
            ) from exc

    def add_read(self, read: Union[Read, CompressedRead]) -> None:
        """
        Add a record to the open POD5 file with either compressed or uncompressed
        signal data depending on the given type of Read.

        Parameters
        ----------
        read : Union[Read, CompressedRead]
            POD5 `Read` or `CompressedRead` object to add as a record to the POD5 file.
        """
        self.add_reads([read])

    def add_reads(self, reads: Sequence[Union[Read, CompressedRead]]) -> None:
        """
        Add Read objects (with uncompressed signal data) or CompressedRead objects
        (with pre-compressed signal data) as records in the open POD5 file. The type
        of the first element decides how the whole sequence is written.

        Parameters
        ----------
        reads : Sequence[Union[Read, CompressedRead]
            Sequence of Read or CompressedRead objects to be added to this POD5 file

        Raises
        ------
        Pod5ApiException
            If the writer handle has been closed
        TypeError
            If the first element is not a Read or CompressedRead
        """

        # Nothing to do
        if not reads:
            return

        if self._writer is None:
            raise Pod5ApiException("Writer handle has been closed")

        if isinstance(reads[0], Read):
            return self._writer.add_reads(  # type: ignore [call-arg]
                *self._prepare_add_reads_args(reads),
                [r.signal for r in reads],  # type: ignore
            )
        elif isinstance(reads[0], CompressedRead):
            signal_chunks = [r.signal_chunks for r in reads]  # type: ignore
            signal_chunk_lengths = [r.signal_chunk_lengths for r in reads]  # type: ignore

            # Array containing the number of chunks for each signal
            signal_chunk_counts = np.array(
                [len(samples_per_chunk) for samples_per_chunk in signal_chunk_lengths],
                dtype=np.uint32,
            )

            return self._writer.add_reads_pre_compressed(  # type: ignore [call-arg]
                *self._prepare_add_reads_args(reads),
                # Join all signal data into one list
                list(itertools.chain(*signal_chunks)),
                # Join all read sample counts into one array
                np.concatenate(signal_chunk_lengths).astype(np.uint32),  # type: ignore [no-untyped-call]
                signal_chunk_counts,
            )
        elif isinstance(reads[0], ReadRecord):
            # Give a more helpful error for records read from an existing file
            raise TypeError(
                "Writer.add_reads(reads) does not take ReadRecords - see ReadRecord.to_read()"
            )
        raise TypeError(f"Writer.add_reads(reads) - unexpected type: {type(reads[0])=}")

    def _prepare_add_reads_args(self, reads: Sequence[BaseRead]) -> List[Any]:
        """
        Converts the sequence of reads into the list of per-field numpy arrays to
        be supplied to the c api. The first item of the returned list is the number
        of reads, followed by one array per field with one entry per read.

        The pore type, end reason and run info of every read are added to the file
        (via `add`) as a side effect, and their indices are what is passed on.
        """
        # Each read id becomes one row of bytes
        read_id = np.array(
            [np.frombuffer(read.read_id.bytes, dtype=np.uint8) for read in reads]
        )
        read_number = np.array([read.read_number for read in reads], dtype=np.uint32)
        start_sample = np.array([read.start_sample for read in reads], dtype=np.uint64)
        channel = np.array([read.pore.channel for read in reads], dtype=np.uint16)
        well = np.array([read.pore.well for read in reads], dtype=np.uint8)
        pore_type = np.array(
            [self.add(PoreType(read.pore.pore_type)) for read in reads], dtype=np.int16
        )
        calib_offset = np.array(
            [read.calibration.offset for read in reads], dtype=np.float32
        )
        calib_scale = np.array(
            [read.calibration.scale for read in reads], dtype=np.float32
        )
        median_before = np.array(
            [read.median_before for read in reads], dtype=np.float32
        )
        end_reason = np.array(
            [self.add(read.end_reason) for read in reads], dtype=np.int16
        )
        end_reason_forced = np.array(
            [read.end_reason.forced for read in reads], dtype=np.bool_
        )
        run_info = np.array([self.add(read.run_info) for read in reads], dtype=np.int16)
        num_minknow_events = np.array(
            [read.num_minknow_events for read in reads], dtype=np.uint64
        )
        tracked_scaling_scale = np.array(
            [read.tracked_scaling.scale for read in reads], dtype=np.float32
        )
        tracked_scaling_shift = np.array(
            [read.tracked_scaling.shift for read in reads], dtype=np.float32
        )
        predicted_scaling_scale = np.array(
            [read.predicted_scaling.scale for read in reads], dtype=np.float32
        )
        predicted_scaling_shift = np.array(
            [read.predicted_scaling.shift for read in reads], dtype=np.float32
        )
        num_reads_since_mux_change = np.array(
            [read.num_reads_since_mux_change for read in reads], dtype=np.uint32
        )
        time_since_mux_change = np.array(
            [read.time_since_mux_change for read in reads], dtype=np.float32
        )
        open_pore_level = np.array(
            [read.open_pore_level for read in reads], dtype=np.float32
        )

        # The order of this list is unpacked positionally by add_reads
        return [
            read_id.shape[0],
            read_id,
            read_number,
            start_sample,
            channel,
            well,
            pore_type,
            calib_offset,
            calib_scale,
            median_before,
            end_reason,
            end_reason_forced,
            run_info,
            num_minknow_events,
            tracked_scaling_scale,
            tracked_scaling_shift,
            predicted_scaling_scale,
            predicted_scaling_shift,
            num_reads_since_mux_change,
            time_since_mux_change,
            open_pore_level,
        ]


================================================
FILE: python/pod5/src/tests/__init__.py
================================================


================================================
FILE: python/pod5/src/tests/conftest.py
================================================
"""
Pod5 test fixtures
"""

from contextlib import contextmanager
import os
from datetime import datetime, timezone
from pathlib import Path
import psutil
import shutil
import sys
from typing import Generator, Optional, Set
from uuid import UUID, uuid4, uuid5

import numpy
import numpy.typing
from pod5.pod5_types import ShiftScalePair
import pytest
import pod5 as p5

# Namespace UUID used with uuid5 to derive read ids from seeds.
# It comes from uuid4(), so it differs every time this module is imported.
TEST_UUID = uuid4()

# `test_data` directory, reached by five `.parent` hops from this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Pod5 file opened by the `reader` fixture
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"

# Seed read from the POD5_TEST_SEED environment variable, falling back to a
# random integer in [1, 9999) when the variable is not set
POD5_TEST_SEED = int(os.getenv("POD5_TEST_SEED", numpy.random.randint(1, 9999)))


# Marker that skips a test when running on a Windows platform
skip_if_windows = pytest.mark.skipif(
    sys.platform.startswith("win"), reason="no symlink privilege on windows CI"
)


# Run pytest from the tests directory (containing conftest.py) to use this argument
def pytest_addoption(parser):
    """
    Register the integer `--pod5-test-seed` command line option.

    When the option is not given, its default is a random integer in
    [1, 9999) drawn at the moment the option is registered.
    """
    fallback_seed = numpy.random.randint(1, 9999)
    parser.addoption(
        "--pod5-test-seed",
        help="pod5_factory test seed",
        default=fallback_seed,
        type=int,
    )


@contextmanager
def assert_no_leaked_handles() -> Generator[None, None, None]:
    """
    Context manager that fails when the wrapped body leaves new files open.

    The open files of the current process are recorded before and after the
    body runs. Files present only afterwards count as leaked, except those
    whose path contains ".log" (compared case-insensitively).

    Raises:
        AssertionError: if any leaked handle remains after filtering.
    """
    process = psutil.Process()
    open_before = set(process.open_files())
    yield
    newly_open = set(process.open_files()) - open_before
    # Log files are deliberately excluded from the check
    leaked_handles = {
        handle for handle in newly_open if ".log" not in str(handle.path).lower()
    }
    if leaked_handles:
        raise AssertionError(f"Leaked handles: {leaked_handles}")


def assert_no_leaked_handles_win(path: Path) -> None:
    """
    Check that no handle to the file at `path` is still open on windows.

    The file is renamed to a `.TEMP` suffix and back again; on windows a
    failing rename shows up a leaked handle. On any other platform this
    function does nothing.

    Args:
        path: The file to probe. The rename is applied to this file, not to
            any module-level default.

    Raises:
        AssertionError: if either rename raises OSError.
    """
    if not sys.platform.lower().startswith("win"):
        return

    temp_path = path.with_suffix(".TEMP")
    try:
        os.rename(path, temp_path)
        os.rename(temp_path, path)
    except OSError:
        raise AssertionError(f"File handle to {path} still open")


@pytest.fixture(scope="function")
def reader() -> Generator[p5.Reader, None, None]:
    """
    Yield a Reader opened on POD5_PATH.

    The reader is opened inside `assert_no_leaked_handles`, and once it is
    closed the windows rename check is run against POD5_PATH.
    """
    with assert_no_leaked_handles(), p5.Reader(path=POD5_PATH) as pod5_reader:
        yield pod5_reader
    assert_no_leaked_handles_win(POD5_PATH)


@pytest.fixture(scope="function")
def writer(tmp_path: Path) -> Generator[p5.Writer, None, None]:
    """
    Yield a Writer targeting `test.pod5` inside the pytest `tmp_path`.

    After the writer is closed the file is renamed to a `.TEMP` suffix and
    back; an OSError from either rename fails the test.
    """
    pod5_path = tmp_path / "test.pod5"
    renamed_path = pod5_path.with_suffix(".TEMP")

    with p5.Writer(pod5_path) as pod5_writer:
        yield pod5_writer

    # Rename there and back to detect a handle that is still open
    try:
        os.rename(pod5_path, renamed_path)
        os.rename(renamed_path, pod5_path)
    except OSError:
        assert False, "File handle still open"


def rand_float(seed: int) -> float:
    """
    Seed numpy's global random state with `seed` and return the first float
    drawn from the half-open interval [0, 1).
    """
    numpy.random.seed(seed)
    (sample,) = numpy.random.rand(1)
    return float(sample)


def rand_int(low: int, high: int, seed: int) -> int:
    """
    Seed numpy's global random state with `seed` and return one integer drawn
    from the half-open interval [low, high).
    """
    numpy.random.seed(seed)
    drawn = numpy.random.randint(low=low, high=high)
    return int(drawn)


def rand_str(prefix: str, seed: int) -> str:
    """
    Return `prefix` followed by an underscore and a seeded random integer.

    numpy's global random state is seeded with `seed` and the integer is drawn
    from [1, 9999999).
    """
    numpy.random.seed(seed)
    suffix = numpy.random.randint(1, 9999999)
    return f"{prefix}_{suffix}"


def _random_read_id(seed: int = 1) -> UUID:
    """Derive a read_id as the uuid5 of `str(seed)` in the TEST_UUID namespace"""
    seed_name = str(seed)
    return uuid5(TEST_UUID, seed_name)


@pytest.fixture(scope="function")
def random_read_id(request) -> UUID:
    """Fixture returning the read_id derived from the seed in `request.param`"""
    seed = request.param
    return _random_read_id(seed)


def _random_pore(seed: int) -> p5.Pore:
    """
    Build a Pore from seeded values: an integer in [0, 3000), an integer in
    [0, 4) and a "pore_type"-prefixed string, passed positionally in that order.
    """
    first_value = rand_int(0, 3000, seed)
    second_value = rand_int(0, 4, seed)
    pore_type_label = rand_str("pore_type", seed)
    return p5.Pore(first_value, second_value, pore_type_label)


@pytest.fixture(scope="function")
def random_pore(request) -> p5.Pore:
    """Fixture returning the Pore built from the seed in `request.param`"""
    seed = request.param
    return _random_pore(seed)


def _random_calibration(seed: int = 1) -> p5.Calibration:
    """
    Build a Calibration from two seeded floats in [0, 1): the first drawn with
    `seed`, the second with `seed + 1`.
    """
    first_value = rand_float(seed)
    second_value = rand_float(seed + 1)
    return p5.Calibration(first_value, second_value)


@pytest.fixture(scope="function")
def random_calibration(request) -> p5.Calibration:
    """Fixture returning the Calibration built from the seed in `request.param`"""
    seed = request.param
    return _random_calibration(seed)


def _random_end_reason(seed: int = 1) -> p5.EndReason:
    """
    Build an EndReason whose enum member is chosen by a seeded integer in [0, 5).

    The second argument comes from `rand_int(0, 1, seed)`; that interval is
    half-open, so the drawn value is always 0 and the resulting bool is
    always False.
    """
    reason = p5.EndReasonEnum(rand_int(0, 5, seed))
    forced = bool(rand_int(0, 1, seed))
    return p5.EndReason(reason, forced)


@pytest.fixture(scope="function")
def random_end_reason(request) -> p5.EndReason:
    """Fixture returning the EndReason built from the seed in `request.param`"""
    seed = request.param
    return _random_end_reason(seed)


def _random_run_info(seed: int = 1) -> p5.RunInfo:
    """
    Build a RunInfo whose every field is derived from `seed`.

    String fields are a fixed prefix plus a seeded integer, and numeric fields
    are seeded integers. Both start times use `rand_int(0, 1, seed)`, a
    half-open interval that only contains 0, so they are always the UTC epoch.
    """

    def text(prefix: str) -> str:
        return rand_str(prefix, seed)

    def start_time() -> datetime:
        return datetime.fromtimestamp(rand_int(0, 1, seed), timezone.utc)

    # Fields are evaluated in the same order as the RunInfo keyword arguments
    fields = dict(
        acquisition_id=text("acq_id"),
        acquisition_start_time=start_time(),
        adc_max=rand_int(0, 1000, seed),
        adc_min=rand_int(-1000, 0, seed),
        context_tags={text("context"): text("tag")},
        experiment_name=text("exp_name"),
        flow_cell_id=text("flow_cell"),
        flow_cell_product_code=text("product_code"),
        protocol_name=text("protocol"),
        protocol_run_id=text("protocol_run_id"),
        protocol_start_time=start_time(),
        sample_id=text("sample_id"),
        sample_rate=rand_int(0, 10000, seed),
        sequencing_kit=text("seq_kit"),
        sequencer_position=text("position"),
        sequencer_position_type=text("position_type"),
        software=text("software"),
        system_name=text("system_name"),
        system_type=text("system_type"),
        tracking_id={text("tracking"): text("id")},
    )
    return p5.RunInfo(**fields)


@pytest.fixture(scope="function")
def random_run_info(request) -> p5.RunInfo:
    """Fixture returning the RunInfo built from the seed in `request.param`"""
    seed = request.param
    return _random_run_info(seed)


def _random_signal(seed: int = 1) -> numpy.typing.NDArray[numpy.int16]:
    """
    Generate a seeded int16 signal.

    The length is a seeded integer in [0, 200_000) and the samples are drawn
    from [-32768, 32767), so the value 32767 itself is never produced.
    """
    numpy.random.seed(seed)
    n_samples = rand_int(0, 200_000, seed)
    return numpy.random.randint(
        low=-32768, high=32767, size=n_samples, dtype=numpy.int16
    )


@pytest.fixture(scope="function")
def random_signal(request) -> numpy.typing.NDArray[numpy.int16]:
    """Fixture returning the signal generated from the seed in `request.param`"""
    seed = request.param
    return _random_signal(seed)


def _random_read(seed: int = 1) -> p5.Read:
    """
    Build a Read whose fields and signal are all derived from `seed`.

    The run info is generated from `seed % 4`, so reads made from different
    seeds can share the same run info.
    """
    signal = _random_signal(seed)
    # Fields are evaluated in the same order as the Read keyword arguments
    fields = dict(
        read_id=_random_read_id(seed),
        pore=_random_pore(seed),
        calibration=_random_calibration(seed),
        read_number=rand_int(0, 100000, seed),
        start_sample=rand_int(0, 10000000, seed),
        median_before=rand_float(seed),
        end_reason=_random_end_reason(seed),
        run_info=_random_run_info(seed % 4),
        predicted_scaling=ShiftScalePair(rand_float(seed), rand_float(seed + 1)),
        tracked_scaling=ShiftScalePair(rand_float(seed + 2), rand_float(seed + 3)),
        signal=signal,
    )
    return p5.Read(**fields)


@pytest.fixture(scope="function")
def random_read(request) -> p5.Read:
    """Fixture returning the Read built from the seed in `request.param`"""
    seed = request.param
    return _random_read(seed)


def _random_read_pre_compressed(seed: int = 1) -> p5.CompressedRead:
    """
    Build a CompressedRead whose fields and signal are all derived from `seed`.

    The seeded signal is passed through `p5.vbz_compress_signal` and stored as
    a single chunk, with the uncompressed sample count as its chunk length.
    The run info is generated from `seed % 4`.
    """
    signal = _random_signal(seed)
    # Fields are evaluated in the same order as the CompressedRead keyword arguments
    fields = dict(
        read_id=_random_read_id(seed),
        pore=_random_pore(seed),
        calibration=_random_calibration(seed),
        read_number=rand_int(0, 100000, seed),
        start_sample=rand_int(0, 10000000, seed),
        median_before=rand_float(seed),
        end_reason=_random_end_reason(seed),
        run_info=_random_run_info(seed % 4),
        predicted_scaling=ShiftScalePair(rand_float(seed), rand_float(seed + 1)),
        tracked_scaling=ShiftScalePair(rand_float(seed + 2), rand_float(seed + 3)),
        signal_chunks=[p5.vbz_compress_signal(signal)],
        signal_chunk_lengths=[len(signal)],
    )
    return p5.CompressedRead(**fields)


@pytest.fixture(scope="function")
def random_read_pre_compressed(request) -> p5.CompressedRead:
    """Fixture returning the CompressedRead built from the seed in `request.param`"""
    seed = request.param
    return _random_read_pre_compressed(seed)


def _seeder(seed: int) -> Generator[int, None, None]:
    """Generates seed values for numpy.rand.seed"""
    idx = 0
    while True:
        value = (seed + idx) % 2**23
        idx += 13
        yield value


@pytest.fixture(scope="session")
def pod5_factory(request, tmp_path_factory: pytest.TempPathFactory, pytestconfig):
    """
    Create and cache a temporary pod5 file of `n_records` random reads with a
    default name unless given a `name` like `my.pod5`. Files are cached under
    their path and are removed when the session ends.

    The seed sequence starts from the `--pod5-test-seed` option and is shared
    by every file the factory creates, so the contents of a file depend on
    the order in which files are requested. The seed is printed to stdout at
    teardown.
    """

    test_seed = pytestconfig.getoption("pod5_test_seed")

    tmp_path = tmp_path_factory.mktemp("pod5_factory")
    existing_pod5s: Set[Path] = set()

    seeder = _seeder(test_seed)

    def _pod5_factory(
        n_records: int = 100,
        name: Optional[str] = None,
    ) -> Path:
        """Generate pod5 files with `n_records` with an optionally specified `name`"""
        assert n_records > 0

        path = tmp_path / (name if name else f"pod5_fixture_{n_records}.pod5")

        if path in existing_pod5s:
            if path.is_file():
                return path
            # The cached file has gone missing, forget it and regenerate below
            existing_pod5s.remove(path)

        reads = [_random_read(seed=next(seeder)) for _ in range(n_records)]
        with p5.Writer(path=path, software_name="pod5_pytest_fixture") as writer:
            writer.add_reads(reads)

        existing_pod5s.add(path)
        assert path.is_file()
        return path

    yield _pod5_factory

    # A test may already have removed a cached file. Skip those so that cleanup
    # cannot fail and the seed below is always reported.
    for path in existing_pod5s:
        if path.is_file():
            path.unlink()

    # Write the test seed to stdout, need to disable capturemanager first
    capmanager = request.config.pluginmanager.getplugin("capturemanager")
    with capmanager.global_and_fixture_disabled():
        print(f"\n\nPOD5_TEST_SEED: {test_seed}")


@pytest.fixture(scope="session")
def nested_dataset(tmp_path_factory: pytest.TempPathFactory, pod5_factory) -> Path:
    """
    Build a nested directory tree populated with temporary pod5 files.

    Symbolic links are only created when not running on windows systems; on
    windows the linked file and the linked directory are plain copies.

    ./root/root_10.pod5
    ./root/subdir/subdir_11.pod5
    ./root/subdir/symbolic_9.pod5 --> ../../outer/symbolic_9.pod5
    ./root/subdir/subsubdir/subsubdir_12.pod5
    ./root/subdir/subsubdir/empty.txt
    ./root/linked/ --> ../linked/

    ./outer/symbolic_9.pod5
    ./linked/linked_8.pod5

    Returns path to root/
    """
    base = tmp_path_factory.mktemp("pod5_nested_directory")
    on_windows = sys.platform.startswith("win")

    root = base / "root"
    sub_dir = root / "subdir"
    subsub_dir = sub_dir / "subsubdir"
    subsub_dir.mkdir(parents=True)

    # Generate the three regular files first, then copy each into place
    sources = [pod5_factory(n_records) for n_records in (10, 11, 12)]
    targets = [
        root / "root_10.pod5",
        sub_dir / "subdir_11.pod5",
        subsub_dir / "subsubdir_12.pod5",
    ]
    for source, target in zip(sources, targets):
        shutil.copyfile(str(source), str(target))

    (subsub_dir / "empty.txt").touch()

    # Linked file
    outer_dir = base / "outer"
    outer_dir.mkdir(parents=True)
    symbolic_pod5: Path = pod5_factory(9)
    symb_path = outer_dir / "symbolic_9.pod5"
    symbolic_entry = sub_dir / "symbolic_9.pod5"

    if on_windows:
        shutil.copyfile(str(symbolic_pod5), str(symbolic_entry))
    else:
        shutil.copyfile(str(symbolic_pod5), str(symb_path))
        symbolic_entry.symlink_to(symb_path)

    # Linked directory
    linked_src_dir = base / "linked"
    linked_src_dir.mkdir(parents=True)
    linked_pod5: Path = pod5_factory(8)
    shutil.copyfile(str(linked_pod5), str(linked_src_dir / "linked_8.pod5"))

    linked_entry = root / "linked"
    if on_windows:
        linked_entry.mkdir(parents=True)
        shutil.copyfile(str(linked_pod5), str(linked_entry / "linked_8.pod5"))
    else:
        linked_entry.symlink_to(linked_src_dir)

    return root


================================================
FILE: python/pod5/src/tests/test_api.py
================================================
import tempfile
from datetime import datetime, timezone
from pathlib import Path
from typing import Union
from uuid import UUID, uuid4, uuid5

import numpy as np
import pytest

import pod5 as p5
from pod5.api_utils import format_read_ids, pack_read_ids
from pod5.writer import Writer

# Namespace UUID that gen_test_read combines with the seed (via uuid5) to build
# read ids; it is a fresh uuid4 on every import of this module
TEST_UUID = uuid4()


def gen_test_read(seed, compressed=False) -> Union[p5.Read, p5.CompressedRead]:
    """
    Build a read whose random fields are reproducible from `seed`.

    numpy's global random state is seeded once and every value is then drawn
    from it in a fixed order, so calling this twice with the same seed gives
    the same signal and field values.

    Args:
        seed: Seed for numpy's global random state; also names the read id.
        compressed: When true a `p5.CompressedRead` holding the vbz-compressed
            signal as a single chunk is returned, otherwise a `p5.Read`.
    """
    np.random.seed(seed)

    def random_unit_float() -> float:
        # 100000 values are drawn and only the first is kept. The number of
        # draws is part of the random stream and must not change.
        return float(np.random.rand(100000)[0])

    def random_int(low: int, high: int) -> int:
        return int(np.random.randint(low, high, 1)[0])

    def random_label(prefix: str) -> str:
        return f"{prefix}_{np.random.randint(100000)}"

    n_samples = random_int(0, 1000)
    signal = np.random.randint(0, 1024, n_samples, dtype=np.int16)

    if compressed:
        read_type = p5.CompressedRead  # type: ignore
        signal_kwargs = {
            "signal_chunks": [p5.signal_tools.vbz_compress_signal(signal)],  # type: ignore
            "signal_chunk_lengths": [len(signal)],  # type: ignore
        }
    else:
        read_type = p5.Read  # type: ignore
        signal_kwargs = {"signal": signal}  # type: ignore

    # The statements below consume the random stream in a fixed order
    read_id = uuid5(TEST_UUID, str(seed))
    pore = p5.Pore(
        random_int(0, 3000),
        random_int(0, 4),
        random_label("pore_type"),
    )
    calibration = p5.Calibration(random_unit_float(), random_unit_float())
    read_number = random_int(0, 100000)
    start_sample = random_int(0, 10000000)
    median_before = random_unit_float()
    end_reason = p5.EndReason(
        p5.EndReasonEnum(random_int(0, 5)), bool(random_int(0, 1))
    )
    run_info = p5.RunInfo(
        random_label("acq_id"),
        datetime.fromtimestamp(random_int(0, 1), timezone.utc),
        random_int(0, 1000),
        random_int(-1000, 0),
        {random_label("context"): random_label("tag")},
        random_label("exp_name"),
        random_label("flow_cell"),
        random_label("product_code"),
        random_label("protocol"),
        random_label("protocol_run_id"),
        datetime.fromtimestamp(random_int(0, 1), timezone.utc),
        random_label("sample_id"),
        random_int(0, 10000),
        random_label("seq_kit"),
        random_label("position"),
        random_label("position_type"),
        random_label("software"),
        random_label("system_name"),
        random_label("system_type"),
        {random_label("tracking"): random_label("id")},
    )

    return read_type(
        read_id,
        pore,
        calibration,
        read_number,
        start_sample,
        median_before,
        end_reason,
        run_info,
        num_minknow_events=5,
        tracked_scaling=p5.pod5_types.ShiftScalePair(10.0, 50),
        predicted_scaling=p5.pod5_types.ShiftScalePair(5.0, 100.0),
        num_reads_since_mux_change=123,
        time_since_mux_change=456.0,
        open_pore_level=1234.0,
        **signal_kwargs,
    )


def run_writer_test(f: Writer):
    """
    Write the reads for seeds 0 to 9 to the writer `f`.

    Seeds 0 and 1 are added one at a time with `add_read`; seeds 2-5 and 6-9
    are added as two batches with `add_reads`. Seed 1 and seeds 6-9 are
    pre-compressed when the writer's signal compression type is VbzSignal.
    """
    use_compressed = f.signal_compression_type == p5.SignalType.VbzSignal

    for seed, compressed in ((0, False), (1, use_compressed)):
        single_read = gen_test_read(seed, compressed=compressed)
        print("read", single_read.read_id, single_read.run_info.adc_max)
        f.add_read(single_read)

    plain_batch = [gen_test_read(seed) for seed in range(2, 6)]
    print("read", plain_batch[0].read_id, plain_batch[0].run_info.adc_max)
    f.add_reads(plain_batch)

    final_batch = [
        gen_test_read(seed, compressed=use_compressed) for seed in range(6, 10)
    ]
    f.add_reads(final_batch)
    assert final_batch[0].sample_count > 0


def run_reader_test(reader: p5.Reader):
    """
    Check that `reader` returns the reads written by `run_writer_test`.

    Each record is compared with the read regenerated by `gen_test_read` for
    its position in the file. Batch iteration, signal preloading, lookups of
    a missing read id and lookups of selected read ids are then exercised.
    """
    # Check top level file metadata
    assert reader.writing_software == "Python API"
    assert reader.file_identifier != UUID(int=0)

    n_seen = 0
    seen_read_ids = set()
    for seed, record in enumerate(reader.reads()):
        n_seen += 1
        expected = gen_test_read(seed)

        seen_read_ids.add(str(record.read_id))

        assert isinstance(expected, p5.Read)

        assert expected.read_id == record.read_id
        assert expected.read_number == record.read_number
        assert expected.start_sample == record.start_sample
        assert pytest.approx(expected.median_before) == record.median_before

        assert expected.pore == record.pore
        assert pytest.approx(expected.calibration.offset) == record.calibration.offset
        assert pytest.approx(expected.calibration.scale) == record.calibration.scale
        assert expected.run_info == record.run_info

        # Digitisation is the number of ADC levels spanned by the run info
        adc_levels = expected.run_info.adc_max - expected.run_info.adc_min + 1
        assert adc_levels == record.calibration_digitisation
        assert (
            pytest.approx(expected.calibration.scale * adc_levels)
            == record.calibration_range
        )
        assert expected.end_reason.name == record.end_reason.name
        assert expected.end_reason.forced == record.end_reason.forced

        assert expected.num_minknow_events == record.num_minknow_events
        assert expected.tracked_scaling == record.tracked_scaling
        assert expected.predicted_scaling == record.predicted_scaling
        assert (
            expected.num_reads_since_mux_change == record.num_reads_since_mux_change
        )
        assert expected.time_since_mux_change == record.time_since_mux_change
        assert expected.open_pore_level == record.open_pore_level

        assert expected.sample_count == record.sample_count
        # Expecting poor compression given the random input
        raw_byte_size = len(expected.signal) * expected.signal.itemsize
        assert 0 < record.byte_count < (raw_byte_size + 24)
        assert len(record.signal_rows) >= 1

        assert not record.has_cached_signal
        assert (record.signal == expected.signal).all()
        assert (
            pytest.approx(record.signal_pa)
            == (expected.signal + expected.calibration.offset)
            * expected.calibration.scale
        )
        per_chunk = [
            record.signal_for_chunk(chunk)
            for chunk in range(len(record.signal_rows))
        ]
        assert (np.concatenate(per_chunk) == expected.signal).all()
        assert isinstance(record.end_reason_index, int)
        assert record.end_reason_index == record.end_reason.reason.value
        assert isinstance(record.run_info_index, int)

    assert reader.num_reads == n_seen
    assert set(reader.read_ids) == seen_read_ids

    # Try to walk through the file in read batches:
    for batch in reader.read_batches(preload={"samples"}):
        assert len(batch.cached_samples_column) == batch.num_reads

    # Try to walk through specific batches in the file:
    for batch in reader.read_batches(batch_selection=[0], preload={"samples"}):
        assert len(batch.cached_samples_column) == batch.num_reads
        assert len(batch.cached_sample_count_column) == batch.num_reads
        for seed, record in enumerate(batch.reads()):
            expected = gen_test_read(seed)
            assert isinstance(expected, p5.Read)
            assert record.has_cached_signal
            assert (record.signal == expected.signal).all()

    # Try to walk through all reads in the file:
    for seed, record in enumerate(reader.reads(preload={"samples"})):
        expected = gen_test_read(seed)

        assert isinstance(expected, p5.Read)
        assert record.has_cached_signal
        assert (record.signal == expected.signal).all()

    # A bad read id must raise when missing ids are not tolerated
    with pytest.raises(RuntimeError):
        for _ in reader.reads(["bad-id"], missing_ok=False):
            # Shouldn't hit this!
            assert False

    # A bad read id yields nothing when missing ids are tolerated
    for _ in reader.reads(["bad-id"], missing_ok=True):
        # Shouldn't hit this!
        assert False

    all_records = list(reader.reads())
    wanted = [all_records[position] for position in (6, 3, 1)]

    search = reader.reads([str(record.read_id) for record in wanted])

    found_ids = {found.read_id for found in search}
    assert found_ids == {record.read_id for record in wanted}


@pytest.mark.filterwarnings("ignore: pod5.")
def test_pyarrow_from_pathlib():
    """Write then read back a pod5 file addressed by a `pathlib.Path`"""
    with tempfile.TemporaryDirectory() as tmp_dir:
        pod5_path = Path(tmp_dir) / "example.pod5"

        with p5.Writer(pod5_path) as writer:
            run_writer_test(writer)

        with p5.Reader(pod5_path) as reader:
            run_reader_test(reader)


@pytest.mark.filterwarnings("ignore: pod5.")
def test_pyarrow_from_str():
    """Write then read back a pod5 file addressed by a plain `str` path"""
    with tempfile.TemporaryDirectory() as tmp_dir:
        pod5_path = str(Path(tmp_dir) / "example.pod5")

        with p5.Writer(pod5_path) as writer:
            run_writer_test(writer)

        with p5.Reader(pod5_path) as reader:
            run_reader_test(reader)


@pytest.mark.filterwarnings("ignore: pod5.")
def test_pyarrow_from_pathlib_uncompressed():
    """Write then read back a pod5 file using the UncompressedSignal signal type"""
    signal_type = p5.SignalType.UncompressedSignal
    with tempfile.TemporaryDirectory() as tmp_dir:
        pod5_path = Path(tmp_dir) / "example.pod5"

        with p5.Writer(pod5_path, signal_compression_type=signal_type) as writer:
            run_writer_test(writer)

        with p5.Reader(pod5_path) as reader:
            run_reader_test(reader)


def test_read_id_packing():
    """
    Assert pack_read_ids repacks and format_read_ids correctly unpacks collections
    of read ids
    """
    rids = [str(uuid4()) for _ in range(10)]
    packed_rids = pack_read_ids(rids)

    assert len(rids) == 10
    assert isinstance(packed_rids, np.ndarray)
    assert packed_rids.dtype == np.uint8

    unpacked_rids = format_read_ids(packed_rids)
    assert isinstance(unpacked_rids, list)
    # zip() stops at the shorter input, so without this check dropped ids
    # would go unnoticed by the comparison loop below
    assert len(unpacked_rids) == len(rids)

    for rid, unpacked in zip(rids, unpacked_rids):
        assert type(rid) is type(unpacked)
        assert rid == unpacked


================================================
FILE: python/pod5/src/tests/test_convert_from_fast5.py
================================================
"""
Test for the convert_from_fast5 tool
"""

import datetime
import multiprocessing as mp
from pathlib import Path
import queue
import sys
from typing import Dict
from unittest.mock import MagicMock, Mock, patch
from uuid import UUID

import h5py
import numpy as np

import pytest

import pod5
from pod5.tools.pod5_convert_from_fast5 import (
    OutputHandler,
    QueueManager,
    convert_datetime_as_epoch_ms,
    convert_fast5_end_reason,
    convert_fast5_files,
    convert_fast5_read,
    convert_from_fast5,
    convert_run_info,
    get_read_from_fast5,
    handle_exception,
    is_multi_read_fast5,
    logger,
)


# `test_data` directory, reached by five `.parent` hops from this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Fast5 file whose reads are compared against EXPECTED_POD5_RESULTS
FAST5_PATH = TEST_DATA_PATH / "multi_fast5_zip.fast5"

# Path to a fast5 file stored with a `.fast5.single-read` suffix
SINGLE_READ_FAST5_PATH = (
    TEST_DATA_PATH
    / "single_read_fast5/fe85b517-62ee-4a33-8767-41cab5d5ab39.fast5.single-read"
)

EXPECTED_POD5_RESULTS = {
    "0000173c-bf67-44e7-9a9c-1ad0bc728e74": pod5.Read(
        read_id=UUID("0000173c-bf67-44e7-9a9c-1ad0bc728e74"),
        pore=pod5.Pore(
            channel=109,
            well=4,
            pore_type="not_set",
        ),
        calibration=pod5.Calibration.from_range(
            offset=21.0,
            adc_range=1437.6976318359375,
            digitisation=8192.0,
        ),
        read_number=1093,
        start_sample=4534321,
        median_before=183.1077423095703,
        end_reason=pod5.EndReason(
            pod5.EndReasonEnum.UNKNOWN,
            False,
        ),
        run_info=pod5.RunInfo(
            acquisition_id="a08e850aaa44c8b56765eee10b386fc3e516a62b",
            acquisition_start_time=datetime.datetime(
                2019, 5, 13, 11, 11, 43, tzinfo=datetime.timezone.utc
            ),
            adc_max=4095,
            adc_min=-4096,
            context_tags={
                "basecall_config_filename": "dna_r9.4.1_450bps_fast.cfg",
                "experiment_duration_set": "180",
                "experiment_type": "genomic_dna",
                "package": "bream4",
                "package_version": "4.0.6",
                "sample_frequency": "4000",
                "sequencing_kit": "sqk-lsk108",
            },
            experiment_name="",
            flow_cell_id="",
            flow_cell_product_code="",
            protocol_name="c449127e3461a521e0865fe6a88716f6f6b0b30c",
            protocol_run_id="df049455-3552-438c-8176-d4a5b1dd9fc5",
            protocol_start_time=datetime.datetime(
                1970, 1, 1, 0, 0, tzinfo=datetime.timezone.utc
            ),
            sample_id="TEST_SAMPLE",
            sample_rate=4000,
            sequencing_kit="sqk-lsk108",
            sequencer_position="MS00000",
            sequencer_position_type="minion",
            software="python-pod5-converter",
            system_name="",
            system_type="",
            tracking_id={
                "asic_id": "131070",
                "asic_id_eeprom": "0",
                "asic_temp": "35.043102",
                "asic_version": "IA02C",
                "auto_update": "0",
                "auto_update_source": "https://mirror.oxfordnanoportal.com/software/MinKNOW/",
                "bream_is_standard": "0",
                "device_id": "MS00000",
                "device_type": "minion",
                "distribution_status": "modified",
                "distribution_version": "unknown",
                "exp_script_name": "c449127e3461a521e0865fe6a88716f6f6b0b30c",
                "exp_script_purpose": "sequencing_run",
                "exp_start_time": "2019-05-13T11:11:43Z",
                "flow_cell_id": "",
                "guppy_version": "3.0.3+7e7b7d0",
                "heatsink_temp": "35.000000",
                "hostname": "happy_fish",
                "installation_type": "prod",
                "local_firmware_file": "1",
                "operating_system": "ubuntu 16.04",
                "protocol_group_id": "TEST_EXPERIMENT",
                "protocol_run_id": "df049455-3552-438c-8176-d4a5b1dd9fc5",
                "protocols_version": "4.0.6",
                "run_id": "a08e850aaa44c8b56765eee10b386fc3e516a62b",
                "sample_id": "TEST_SAMPLE",
                "usb_config": "MinION_fx3_1.1.1_ONT#MinION_fpga_1.1.0#ctrl#Auto",
                "version": "3.4.0-rc3",
            },
        ),
        # Values are not checked but the length here is from manual inspection
        signal=np.array([1] * 123627, dtype=np.int16),
    ),
    "008468c3-e477-46c4-a6e2-7d021a4ebf0b": pod5.Read(
        read_id=UUID("008468c3-e477-46c4-a6e2-7d021a4ebf0b"),
        pore=pod5.Pore(channel=2, well=2, pore_type="not_set"),
        calibration=pod5.Calibration.from_range(
            offset=4.0,
            adc_range=1437.6976318359375,
            digitisation=8192.0,
        ),
        read_number=411,
        start_sample=2510647,
        median_before=219.04641723632812,
        end_reason=pod5.EndReason(reason=pod5.EndReasonEnum.UNKNOWN, forced=False),
        run_info=pod5.RunInfo(
            acquisition_id="a08e850aaa44c8b56765eee10b386fc3e516a62b",
            acquisition_start_time=datetime.datetime(
                2019, 5, 13, 11, 11, 43, tzinfo=datetime.timezone.utc
            ),
            adc_max=4095,
            adc_min=-4096,
            context_tags={
                "basecall_config_filename": "dna_r9.4.1_450bps_fast.cfg",
                "experiment_duration_set": "180",
                "experiment_type": "genomic_dna",
                "package": "bream4",
                "package_version": "4.0.6",
                "sample_frequency": "4000",
                "sequencing_kit": "sqk-lsk108",
            },
            experiment_name="",
            flow_cell_id="",
            flow_cell_product_code="",
            protocol_name="c449127e3461a521e0865fe6a88716f6f6b0b30c",
            protocol_run_id="df049455-3552-438c-8176-d4a5b1dd9fc5",
            protocol_start_time=datetime.datetime(
                1970, 1, 1, 0, 0, tzinfo=datetime.timezone.utc
            ),
            sample_id="TEST_SAMPLE",
            sample_rate=4000,
            sequencing_kit="sqk-lsk108",
            sequencer_position="MS00000",
            sequencer_position_type="minion",
            software="python-pod5-converter",
            system_name="",
            system_type="",
            tracking_id={
                "asic_id": "131070",
                "asic_id_eeprom": "0",
                "asic_temp": "35.043102",
                "asic_version": "IA02C",
                "auto_update": "0",
                "auto_update_source": "https://mirror.oxfordnanoportal.com/software/MinKNOW/",
                "bream_is_standard": "0",
                "device_id": "MS00000",
                "device_type": "minion",
                "distribution_status": "modified",
                "distribution_version": "unknown",
                "exp_script_name": "c449127e3461a521e0865fe6a88716f6f6b0b30c",
                "exp_script_purpose": "sequencing_run",
                "exp_start_time": "2019-05-13T11:11:43Z",
                "flow_cell_id": "",
                "guppy_version": "3.0.3+7e7b7d0",
                "heatsink_temp": "35.000000",
                "hostname": "happy_fish",
                "installation_type": "prod",
                "local_firmware_file": "1",
                "operating_system": "ubuntu 16.04",
                "protocol_group_id": "TEST_EXPERIMENT",
                "protocol_run_id": "df049455-3552-438c-8176-d4a5b1dd9fc5",
                "protocols_version": "4.0.6",
                "run_id": "a08e850aaa44c8b56765eee10b386fc3e516a62b",
                "sample_id": "TEST_SAMPLE",
                "usb_config": "MinION_fx3_1.1.1_ONT#MinION_fpga_1.1.0#ctrl#Auto",
                "version": "3.4.0-rc3",
            },
        ),
        # Values are not checked but the length here is from manual inspection
        signal=np.array([1] * 206976, dtype=np.int16),
    ),
}


def unraisablehook(unraisable):
    """Print the type, value and traceback of an unraisable exception to stdout"""
    details = (
        unraisable.exc_type,
        unraisable.exc_value,
        unraisable.exc_traceback,
    )
    print(*details)


sys.unraisablehook = unraisablehook


def _naive_utc_from_timestamp(seconds: float) -> datetime.datetime:
    """
    Return the naive UTC datetime for a POSIX timestamp.

    Drop-in replacement for ``datetime.datetime.utcfromtimestamp`` which is
    deprecated since Python 3.12. The aware UTC datetime is built first and its
    tzinfo is then removed so that the string form is unchanged.
    """
    aware = datetime.datetime.fromtimestamp(seconds, datetime.timezone.utc)
    return aware.replace(tzinfo=None)


class TestFast5Conversion:
    """Test the fast5 to pod5 conversion"""

    def test_convert_fast5_read(self) -> None:
        """
        Test known good fast5 reads convert to the expected pod5 read fields
        """
        run_info_cache: Dict[str, pod5.RunInfo] = {}

        with h5py.File(str(FAST5_PATH), "r") as _f5:
            for read_id, expected_read in EXPECTED_POD5_RESULTS.items():
                read = convert_fast5_read(
                    _f5[f"read_{read_id}"],
                    run_info_cache,
                )

                assert expected_read.end_reason == read.end_reason
                assert expected_read.calibration == read.calibration
                assert expected_read.pore == read.pore
                assert expected_read.run_info == read.run_info
                assert expected_read.read_number == read.read_number
                assert expected_read.start_sample == read.start_sample
                assert expected_read.median_before == read.median_before

                # Only the length and dtype of the signal are compared, not the
                # individual sample values
                signal = read.decompressed_signal
                assert expected_read.signal.shape[0] == signal.shape[0]
                assert signal.dtype == np.int16

    @pytest.mark.parametrize(
        "fast5,expected",
        [
            (0, pod5.EndReasonEnum.UNKNOWN),
            (1, pod5.EndReasonEnum.UNKNOWN),
            (2, pod5.EndReasonEnum.MUX_CHANGE),
            (3, pod5.EndReasonEnum.UNBLOCK_MUX_CHANGE),
            (4, pod5.EndReasonEnum.DATA_SERVICE_UNBLOCK_MUX_CHANGE),
            (5, pod5.EndReasonEnum.SIGNAL_POSITIVE),
            (6, pod5.EndReasonEnum.SIGNAL_NEGATIVE),
        ],
    )
    def test_end_reason(self, fast5: int, expected: pod5.EndReasonEnum) -> None:
        """Test each fast5 end reason integer converts to the expected EndReason"""
        exp = pod5.EndReason.from_reason_with_default_forced(expected)
        assert exp == convert_fast5_end_reason(fast5)

    def test_convert_run_info_defaults(self) -> None:
        """
        Test the RunInfo produced when context_tags and tracking_id are empty
        """
        result = convert_run_info(
            acq_id="acq_id",
            adc_max=1,
            adc_min=1,
            sample_rate=1,
            context_tags={},
            device_type="dev_type",
            tracking_id={},
        )

        # Both start times are expected to equal the converted unix epoch
        epoch = convert_datetime_as_epoch_ms(f"{_naive_utc_from_timestamp(0)}")
        assert isinstance(result, pod5.RunInfo)
        assert result.acquisition_id == "acq_id"
        assert result.acquisition_start_time == epoch
        assert result.adc_max == 1
        assert result.adc_min == 1
        assert result.context_tags == {}
        assert result.experiment_name == ""
        assert result.flow_cell_id == ""
        assert result.flow_cell_product_code == ""
        assert result.protocol_name == ""
        assert result.protocol_run_id == ""
        assert result.protocol_start_time == epoch
        assert result.sample_id == ""
        assert result.sample_rate == 1
        assert result.sequencing_kit == ""
        assert result.sequencer_position == ""
        assert result.sequencer_position_type == "dev_type"
        assert result.software == "python-pod5-converter"
        assert result.system_name == ""
        assert result.system_type == ""
        assert result.tracking_id == {}

    def test_convert_run_info(self) -> None:
        """
        Test the RunInfo fields populated from context_tags and tracking_id,
        including bytes values which are expected back as str
        """
        result = convert_run_info(
            acq_id="_acq_id",
            adc_max=2,
            adc_min=3,
            sample_rate=4,
            context_tags={"sequencing_kit": b"sequencing_kit", "ctag": b"ctag"},
            device_type="_dev_type",
            tracking_id={
                "exp_start_time": f"{_naive_utc_from_timestamp(1)}",
                "flow_cell_id": b"flow_cell_id",
                "flow_cell_product_code": b"flow_cell_product_code",
                "exp_script_name": b"exp_script_name",
                "protocol_run_id": b"protocol_run_id",
                "protocol_start_time": f"{_naive_utc_from_timestamp(2)}",
                "sample_id": b"sample_id",
                "sequencing_kit": b"sequencing_kit",
                "device_id": b"device_id",
                "device_type": b"device_type",
                "host_product_serial_number": b"host_product_serial_number",
                "host_product_code": b"host_product_code",
            },
        )

        assert isinstance(result, pod5.RunInfo)
        assert result.acquisition_id == "_acq_id"
        assert result.acquisition_start_time == convert_datetime_as_epoch_ms(
            f"{_naive_utc_from_timestamp(1)}"
        )
        assert result.adc_max == 2
        assert result.adc_min == 3
        assert result.context_tags == {
            "sequencing_kit": "sequencing_kit",
            "ctag": "ctag",
        }
        assert result.experiment_name == ""
        assert result.flow_cell_id == "flow_cell_id"
        assert result.flow_cell_product_code == "flow_cell_product_code"
        assert result.protocol_name == "exp_script_name"
        assert result.protocol_run_id == "protocol_run_id"
        assert result.protocol_start_time == convert_datetime_as_epoch_ms(
            f"{_naive_utc_from_timestamp(2)}"
        )
        assert result.sample_id == "sample_id"
        assert result.sample_rate == 4
        assert result.sequencing_kit == "sequencing_kit"
        assert result.sequencer_position == "device_id"
        # The tracking_id device_type takes precedence over the device_type argument
        assert result.sequencer_position_type == "device_type"
        assert result.software == "python-pod5-converter"
        assert result.system_name == "host_product_serial_number"
        assert result.system_type == "host_product_code"


class TestFast5Detection:
    """Test multi-read fast5 detection and the lookup of reads by group key"""

    def test_single_read_fast5_detection(self):
        """Test a single-read fast5 file is not reported as multi-read"""
        detected = is_multi_read_fast5(SINGLE_READ_FAST5_PATH)
        assert not detected

    def test_multi_read_fast5_detection(self):
        """Test the multi-read fast5 file is reported as multi-read"""
        detected = is_multi_read_fast5(FAST5_PATH)
        assert detected

    def test_read_id_keys_detected(self) -> None:
        """Test that every top-level key of a known good file yields a read"""
        with h5py.File(str(FAST5_PATH), "r") as fast5_file:
            for key in fast5_file.keys():
                found = get_read_from_fast5(key, fast5_file)
                assert found is not None

    def test_unknown_keys_ignored(self) -> None:
        """Test that a key without the read_ prefix returns None"""
        with h5py.File(str(FAST5_PATH), "r") as fast5_file:
            ignored = get_read_from_fast5("bad_key", fast5_file)
        assert ignored is None

    def test_bad_keys_skipped_with_warning(self) -> None:
        """Test that a read_ prefixed key which cannot be read warns and returns None"""
        with h5py.File(str(FAST5_PATH), "r") as fast5_file:
            with pytest.warns(UserWarning, match="Failed to read key"):
                # The key carries the read_ prefix of a good read but is not
                # present in the file, so reading it should fail
                skipped = get_read_from_fast5("read_bad_key", fast5_file)
        assert skipped is None


class TestConvertBehaviour:
    """Test the runtime behaviour of the conversion tool based on the cli arguments"""

    def test_no_unforced_overwrite(self, tmp_path: Path):
        """Assert that the conversion tool will not overwrite existing files"""

        existing = tmp_path / "exists.pod5"
        existing.touch()
        with pytest.raises(FileExistsError):
            convert_from_fast5(inputs=[FAST5_PATH], output=existing)

    def test_forced_overwrite(self, tmp_path: Path):
        """Assert that the conversion tool will overwrite existing file if forced"""

        existing = tmp_path / "exists.pod5"
        existing.touch()
        # touch() leaves an empty placeholder behind
        assert existing.stat().st_size == 0
        convert_from_fast5(inputs=[FAST5_PATH], output=existing, force_overwrite=True)

        # The placeholder must have been replaced by real (non-empty) output
        assert existing.stat().st_size > 0

    def test_directory_output(self, tmp_path: Path):
        """
        Assert that the conversion tool will write to a output directory creating
        a default named output.pod5 file
        """

        assert len(list(tmp_path.rglob("*"))) == 0
        convert_from_fast5(inputs=[FAST5_PATH], output=tmp_path)
        assert len(list(tmp_path.rglob("*.pod5"))) == 1
        assert (tmp_path / "output.pod5").exists()

    def test_single_file_output(self, tmp_path: Path):
        """Assert that the conversion tool will write to a specified file path"""

        output = tmp_path / "filename.pod5"
        assert len(list(tmp_path.rglob("*"))) == 0
        convert_from_fast5(inputs=[FAST5_PATH], output=output)
        assert len(list(tmp_path.rglob("*"))) == 1
        assert output.exists()

    def test_output_121_relative(self, tmp_path: Path):
        """
        Assert that the conversion tool will write one-to-one files as expected,
        mirroring each input's path relative to the one_to_one directory
        """

        clone_1 = tmp_path / "clone1.fast5"
        clone_1.write_bytes(FAST5_PATH.read_bytes())

        clone_2 = tmp_path / "subdir/clone2.fast5"
        clone_2.parent.mkdir(parents=True, exist_ok=False)
        clone_2.write_bytes(FAST5_PATH.read_bytes())

        output = tmp_path / "output"
        output.mkdir(parents=True, exist_ok=True)

        convert_from_fast5(
            inputs=[clone_1, clone_2],
            output=output,
            one_to_one=tmp_path,
            strict=True,
        )

        assert (output / "clone1.pod5").exists()
        assert (output / "subdir/clone2.pod5").exists()

    def test_output_121_relative_no_parents(self, tmp_path: Path):
        """
        Assert that the conversion tool will not write one-to-one files outside of the
        desired output folder
        """

        # This input sits above the one_to_one directory used below
        clone_1 = tmp_path / "relative_parent.fast5"
        clone_1.write_bytes(FAST5_PATH.read_bytes())

        clone_2 = tmp_path / "subdir/clone2.fast5"
        clone_2.parent.mkdir(parents=True, exist_ok=False)
        clone_2.write_bytes(FAST5_PATH.read_bytes())

        output = tmp_path / "output"
        output.mkdir(parents=True, exist_ok=True)

        with pytest.raises(RuntimeError, match="directory must be a relative parent"):
            convert_from_fast5(
                inputs=[clone_1, clone_2],
                output=output,
                one_to_one=tmp_path / "subdir",
                strict=True,
            )


class TestOutputHandler:
    """Test the writers handed out, reused and closed by the OutputHandler"""

    def test_output_handler_default_writer(self, tmp_path: Path):
        """Assert that the OutputHandler creates an output file with default name"""
        handler = OutputHandler(tmp_path, None, False)
        source = tmp_path / "test.fast5"
        writer = handler.get_writer(source)

        assert isinstance(writer, pod5.Writer)
        assert writer.path == tmp_path / "output.pod5"

        handler.close_all()
        assert writer._writer is None
        assert len(list(tmp_path.glob("*.pod5"))) == 1

    def test_output_handler_one_to_one_writer(self, tmp_path: Path):
        """Assert that the OutputHandler creates output name is similar when in 1:1"""
        handler = OutputHandler(tmp_path, tmp_path, False)
        source = tmp_path / "test.fast5"
        writer = handler.get_writer(source)

        assert isinstance(writer, pod5.Writer)
        assert writer.path == tmp_path / "test.pod5"

        handler.close_all()
        assert writer._writer is None
        assert len(list(tmp_path.glob("*.pod5"))) == 1

    def test_output_handler_one_to_one_multiple_writer(self, tmp_path: Path):
        """Assert that the OutputHandler creates one output per input when in 1:1"""
        handler = OutputHandler(tmp_path, tmp_path, False)

        names = ["test1.fast5", "test2.fast5", "example.fast5"]
        try:
            for name in names:
                writer = handler.get_writer(tmp_path / name)

                assert isinstance(writer, pod5.Writer)
                assert writer.path == (tmp_path / name).with_suffix(".pod5")

            assert len(list(tmp_path.glob("*.pod5"))) == len(names)
        finally:
            # Always release the writers, even when an assertion above fails
            handler.close_all()

    def test_no_reopen(self, tmp_path: Path):
        """Assert that the OutputHandler will not re-open a completed input's writer"""
        handler = OutputHandler(tmp_path, tmp_path, False)
        example = tmp_path / "example"
        try:
            handler.get_writer(example)
            handler.set_input_complete(example, is_exception=False)
            with pytest.raises(FileExistsError, match="Trying to re-open"):
                handler.get_writer(example)
        finally:
            # Release anything still open so no file handles outlive the test
            handler.close_all()

    def test_none_if_exception(self, tmp_path: Path):
        """Assert that no writer is returned for an input completed with an exception"""
        handler = OutputHandler(tmp_path, tmp_path, False)
        example = tmp_path / "example"
        try:
            handler.get_writer(example)
            handler.set_input_complete(example, is_exception=True)
            assert handler.get_writer(example) is None
        finally:
            # Release anything still open so no file handles outlive the test
            handler.close_all()

    def test_no_duplicate_open(self, tmp_path: Path):
        """Assert that the OutputHandler will reuse handles"""
        handler = OutputHandler(tmp_path, tmp_path, False)
        example = tmp_path / "example"
        try:
            writer1 = handler.get_writer(example)
            writer2 = handler.get_writer(example)
            assert writer1 == writer2
        finally:
            # The shared writer is still open here and must be closed
            handler.close_all()


class TestQueueManager:
    """Test the QueueManager queues and the counts reported by shutdown"""

    @staticmethod
    def _assert_getters_closed(queues) -> None:
        """Assert that every queue getter raises because its queue is closed"""
        for getter in [
            queues.await_data,
            queues.await_request,
            queues.get_exception,
            queues.get_input,
        ]:
            with pytest.raises((OSError, ValueError), match="is closed"):
                # OSError changed to ValueError in py3.8
                getter()

    def test_shutdown(self, monkeypatch, caplog: pytest.LogCaptureFixture):
        """Test shutdown of an untouched manager reports only the unfinished input"""
        # Enable logging through monkeypatch so the previous logger state is
        # restored after the test instead of leaking into other tests
        monkeypatch.setattr(logger, "disabled", False)
        monkeypatch.setenv("POD5_DEBUG", "1")
        threads, timeout = 5, 0.05
        ctx = mp.get_context("spawn")
        queues = QueueManager(ctx, [FAST5_PATH], threads, timeout)
        n_inputs, n_req, n_data, n_exc = queues.shutdown()
        assert n_inputs == 1
        assert "Unfinished inputs" in caplog.messages[0]
        assert n_req == threads * 2
        assert n_data == 0
        assert n_exc == 0

        self._assert_getters_closed(queues)

        # A second shutdown must not raise
        queues.shutdown()

    def test_shutdown_with_work(self, monkeypatch, caplog: pytest.LogCaptureFixture):
        """Test shutdown reports and logs unfinished inputs, data and exceptions"""
        # Enable logging through monkeypatch so the previous logger state is
        # restored after the test instead of leaking into other tests
        monkeypatch.setattr(logger, "disabled", False)
        monkeypatch.setenv("POD5_DEBUG", "1")
        threads, timeout = 1, 0.05
        ctx = mp.get_context("spawn")
        queues = QueueManager(ctx, [FAST5_PATH], threads, timeout)
        queues.enqueue_data(None, None)
        queues.enqueue_exception(Path.cwd(), Exception("blah"), "text")
        n_inputs, n_req, n_data, n_exc = queues.shutdown()
        assert n_inputs == 1
        assert "Unfinished inputs" in caplog.messages[0]
        assert n_req == threads * 2
        assert n_data == 1
        assert "Unfinished data" in caplog.messages[1]
        assert n_exc == 1
        assert "Unfinished exceptions" in caplog.messages[2]

        self._assert_getters_closed(queues)

        # A second shutdown must not raise
        queues.shutdown()

    def test_blocked_by_requests(self) -> None:
        """Test awaiting a request times out once the requests queue is exhausted"""
        threads, timeout = 3, 0.05
        ctx = mp.get_context("spawn")
        queues = QueueManager(ctx, [FAST5_PATH], threads, timeout)
        # Exhaust the requests queue
        for _ in range(queues._requests_size):
            queues.await_request()

        with pytest.raises(TimeoutError, match="No progress"):
            queues.await_request()

        # A newly enqueued request can be awaited again
        queues.enqueue_request()
        queues.await_request()

        # No data was ever enqueued so awaiting it must time out as well
        with pytest.raises(TimeoutError, match="No progress"):
            queues.await_data()

        queues.shutdown()

    def test_data_queue(self) -> None:
        """Test data items are returned in order and that list data replaces a request"""
        threads, timeout = 5, 0.05
        ctx = mp.get_context("spawn")
        queues = QueueManager(ctx, [FAST5_PATH], threads, timeout)

        # Assert initially empty
        with pytest.raises(TimeoutError, match="No progress"):
            queues.await_data()

        queues.enqueue_data(FAST5_PATH, [])
        queues.enqueue_data(FAST5_PATH, 100)
        queues.enqueue_data(None, None)

        queues.await_request()
        assert queues.await_data() == (FAST5_PATH, [])
        assert queues.await_data() == (FAST5_PATH, 100)
        assert queues.await_data() == (None, None)

        # Assert await data for list of reads replaced the request by checking
        # for requests being Full
        queues.enqueue_data(FAST5_PATH, [])
        with pytest.raises(queue.Full):
            queues.await_data()

        # Assert only 1 request taken and replaced
        n_inputs, n_req, n_data, n_exc = queues.shutdown()
        assert n_req == threads * 2

    def test_exception_queue(self) -> None:
        """Test exceptions are returned as enqueued and None is returned when empty"""
        threads, timeout = 5, 0.05
        ctx = mp.get_context("spawn")
        queues = QueueManager(ctx, [FAST5_PATH], threads, timeout)

        # Assert initially empty
        assert queues.get_exception() is None

        queues.enqueue_exception(FAST5_PATH, Exception("foo"), "bar")
        item = queues.get_exception()
        assert item is not None
        path, exc, trace = item
        assert path == FAST5_PATH
        with pytest.raises(Exception, match="foo"):
            raise exc
        assert trace == "bar"

        # Assert the number of requests is the same as for an untouched manager
        n_inputs, n_req, n_data, n_exc = queues.shutdown()
        assert n_req == threads * 2


class TestConvertLoop:
    """Test the convert_fast5_files loop and the handling of its exceptions"""

    def test_convert_fast5_files_file_type_exceptions(self, tmp_path: Path) -> None:
        """Test an empty file named .fast5 is reported as not a multi-read fast5"""
        not_fast5 = tmp_path / "not_a.fast5"
        not_fast5.touch()
        manager = QueueManager(mp.get_context("spawn"), [not_fast5], 5, 0.05)
        convert_fast5_files(manager)

        item = manager.get_exception()
        assert item is not None
        failed_path, error, _ = item
        assert failed_path == not_fast5

        manager.shutdown()
        with pytest.raises(TypeError, match="not a multi-read fast5"):
            raise error

    def test_convert_fast5_files_breaks_loop(self) -> None:
        """Test the loop ends without inputs, leaving only the sentinel data item"""
        manager = QueueManager(mp.get_context("spawn"), [], 1, 0.05)
        convert_fast5_files(manager)

        assert manager.get_exception() is None

        # Assert sentinel enqueued
        sentinel_path, sentinel_data = manager.await_data()
        assert sentinel_path is None
        assert sentinel_data is None

        manager.shutdown()

    @patch("pod5.tools.pod5_convert_from_fast5.convert_fast5_file")
    def test_convert_fast5_file_exception(self, mock: Mock) -> None:
        """Test an exception raised while converting a file is queued with its path"""
        manager = QueueManager(mp.get_context("spawn"), [FAST5_PATH], 5, 0.05)
        # Make the patched per-file conversion raise
        mock.side_effect = Exception
        convert_fast5_files(manager)

        item = manager.get_exception()
        assert item is not None
        failed_path, error, _ = item
        assert failed_path == FAST5_PATH
        with pytest.raises(Exception):
            raise error

        # The sentinel is still enqueued after the failure
        sentinel_path, sentinel_data = manager.await_data()
        assert sentinel_path is None
        assert sentinel_data is None

        manager.shutdown()

    def test_handle_exception(self) -> None:
        """
        Test handle_exception raises when its final argument is True and returns
        None when it is False
        """
        output_handler, status_writer = MagicMock(), MagicMock()
        failure = (FAST5_PATH, Exception("foo"), "bar")
        with pytest.raises(Exception, match="foo"):
            handle_exception(failure, output_handler, status_writer, True)

        output_handler.set_input_complete.assert_called_once_with(
            FAST5_PATH, is_exception=True
        )
        status_writer.write.assert_called_once_with("foo", sys.stderr)
        status_writer.close.assert_called_once()

        outcome = handle_exception(failure, output_handler, status_writer, False)
        assert outcome is None


================================================
FILE: python/pod5/src/tests/test_convert_to_fast5.py
================================================
"""
Tests for the convert_to_fast5 tool
"""

from pathlib import Path

import numpy as np
import pytest

import pod5 as p5
from pod5.tools.pod5_convert_from_fast5 import convert_from_fast5
from pod5.tools.pod5_convert_to_fast5 import convert_to_fast5

# "test_data" directory located five parent hops above this test module
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Fast5 and pod5 fixture files inside the test data directory
FAST5_PATH = TEST_DATA_PATH / "multi_fast5_zip.fast5"
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"


class TestPod5ConversionRoundTrip:
    """Test the pod5 to fast5 conversion and back again to assert consistency"""

    def test_convert_pod5_to_fast5_and_back(self, tmp_path: Path) -> None:
        """
        Test known good pod5 file converts to a fast5 file and back again
        """

        # Convert to fast5
        convert_to_fast5([POD5_PATH], tmp_path, False)

        fast5_paths = list(tmp_path.glob("*.fast5"))
        assert len(fast5_paths) == 1

        # Expected filename has input filename with some extra indexing data
        expected_fast5_name = "multi_fast5_zip_v4.0_0.fast5"
        assert fast5_paths[0].name == expected_fast5_name

        # Convert back to pod5
        convert_from_fast5(fast5_paths, tmp_path)

        pod5_paths = list(tmp_path.glob("*.pod5"))
        assert len(pod5_paths) == 1

        # Ensure we aren't cheating
        assert POD5_PATH != pod5_paths[0]

        expected_tested_reads, count_tested_reads = (10, 0)
        with p5.Reader(POD5_PATH) as original:
            with p5.Reader(pod5_paths[0]) as converted:
                # zip() stops at the shorter reader, so extra reads in either
                # file would go unnoticed without comparing the totals first
                assert original.num_reads == converted.num_reads

                for original_record, converted_record in zip(original, converted):
                    # Assert fields are identical
                    assert original_record.read_id == converted_record.read_id
                    assert original_record.read_number == converted_record.read_number
                    assert (
                        original_record.num_minknow_events
                        == converted_record.num_minknow_events
                    )
                    assert original_record.calibration == converted_record.calibration
                    assert original_record.end_reason == converted_record.end_reason
                    assert original_record.pore == converted_record.pore
                    assert original_record.run_info == converted_record.run_info
                    assert original_record.start_sample == converted_record.start_sample
                    assert original_record.num_samples == converted_record.num_samples
                    assert np.array_equal(
                        original_record.signal, converted_record.signal
                    )

                    count_tested_reads += 1

        # Assert we didn't miss any reads
        assert count_tested_reads == expected_tested_reads


class TestConvertBehaviour:
    """Test the runtime behaviour of the conversion tool based on the cli arguments"""

    def test_no_unforced_overwrite(self, tmp_path: Path):
        """Assert that the conversion tool will not overwrite existing files"""

        existing = tmp_path / "multi_fast5_zip_v4.0_0.fast5"
        existing.touch()
        with pytest.raises(FileExistsError):
            convert_to_fast5(inputs=[POD5_PATH], output=tmp_path, force_overwrite=False)

    def test_forced_overwrite(self, tmp_path: Path):
        """Assert that the conversion tool will overwrite existing file if forced"""

        existing = tmp_path / "multi_fast5_zip_v4.0_0.fast5"
        existing.touch()
        # touch() leaves an empty placeholder behind
        assert existing.stat().st_size == 0
        convert_to_fast5(inputs=[POD5_PATH], output=tmp_path, force_overwrite=True)

        # Assert the file has been replaced. The size is compared rather than the
        # modification time as the resolution of st_mtime depends on the
        # file system and a fast conversion may not advance it
        assert existing.stat().st_size > 0

    def test_recursive_input(self, tmp_path: Path):
        """Assert that the conversion finds pod5s in subdirs"""

        subdir = tmp_path / "sub/subsub/"
        subdir.mkdir(parents=True)
        src = subdir / "input.pod5"
        src.write_bytes(POD5_PATH.read_bytes())

        convert_to_fast5(inputs=[tmp_path], output=tmp_path, recursive=True)
        # At least one fast5 must have been written directly into the output
        assert len(list(tmp_path.glob("*.fast5"))) > 0

    def test_multiple_outputs(self, tmp_path: Path):
        """
        Assert that the conversion tool will write multiple files where the
        files-read-count is low
        """
        expect = [
            tmp_path / "multi_fast5_zip_v4.0_0.fast5",
            tmp_path / "multi_fast5_zip_v4.1_0.fast5",
        ]

        assert len(list(tmp_path.rglob("*"))) == 0

        # input reads == 10 so expect 2 files
        convert_to_fast5(inputs=[POD5_PATH], output=tmp_path, file_read_count=5)
        fast5s_found = list(tmp_path.rglob("*.fast5"))
        assert len(fast5s_found) == 2

        # Exactly the two expected file names must have been produced
        assert set(fast5s_found) == set(expect)


================================================
FILE: python/pod5/src/tests/test_dataset.py
================================================
import random
import shutil
import warnings
from pathlib import Path
from uuid import uuid4

import numpy as np
import pytest

import pod5 as p5
from pod5.api_utils import Pod5ApiException
from pod5.reader import ReadRecord
from tests.conftest import (
    POD5_PATH,
    assert_no_leaked_handles,
    assert_no_leaked_handles_win,
)

# Number of reads the single-file tests expect to find in POD5_PATH
POD5_PATH_EXPECTED_NUM_READS = 10

# NO LINKS ON WINDOWS
# nested_dataset/
# ./root/root_10.pod5
# ./root/subdir/subdir_11.pod5
# ./root/subdir/symbolic_9.pod5 --> ../../outer/symbolic_9.pod5
# ./root/subdir/subsubdir/subsubdir_12.pod5
# ./root/subdir/subsubdir/empty.txt
# ./root/linked/ --> ../linked/

# ./outer/symbolic_9.pod5
# ./linked/linked_8.pod5

# Recursive discovery over the layout sketched above: five pod5 files whose
# read counts (presumably the numeric suffix of each file name) are summed
EXPECT_FILE_COUNT_RECURSIVE = 5
EXPECT_READ_COUNT_RECURSIVE = 8 + 9 + 10 + 11 + 12
# Non-recursive discovery: only root_10.pod5 in the dataset root
EXPECT_FILE_COUNT_ROOT = 1
EXPECT_READ_COUNT_ROOT = 10


class TestDatasetReader:
    """
    Test the DatasetReader
    """

    def test_bad_file_num_reads(self, tmp_path: Path) -> None:
        """An empty (invalid) pod5 file raises when its reads are counted"""
        empty = tmp_path / "empty.pod5"
        empty.touch()

        with p5.DatasetReader(empty) as dataset:
            with pytest.raises(Pod5ApiException, match="DatasetReader error reading:"):
                # Accessing the attribute is what triggers the read
                dataset.num_reads

    def test_len_single(self) -> None:
        """A single-file dataset reports the same read count as a plain Reader"""
        assert (
            p5.Reader(POD5_PATH).num_reads
            == len(p5.DatasetReader(POD5_PATH))
            == POD5_PATH_EXPECTED_NUM_READS
        )

    def test_iter_single(self) -> None:
        """Iterating a single-file dataset yields every record exactly once"""
        observed = set()
        for record in p5.DatasetReader(POD5_PATH):
            assert isinstance(record, ReadRecord)
            observed.add(record.read_id)
        assert len(observed) == POD5_PATH_EXPECTED_NUM_READS

    def test_no_recursive(self, nested_dataset: Path) -> None:
        """Test root directory file discovery only"""
        with p5.DatasetReader(nested_dataset) as dataset:
            expected_path = nested_dataset / "root_10.pod5"
            assert dataset._paths == [expected_path]
            assert len(dataset) == 10

            reader = dataset.get_reader(expected_path)
            observed_count = 0
            for reader_read, dataset_read in zip(reader, dataset):
                observed_count += 1
                assert reader_read.read_id == dataset_read.read_id
            assert observed_count == len(dataset)

    def test_recursive(self, nested_dataset: Path) -> None:
        """Test recursive file discovery"""
        dataset = p5.DatasetReader(nested_dataset, recursive=True)

        assert len(dataset.paths) == EXPECT_FILE_COUNT_RECURSIVE
        assert len(dataset) == EXPECT_READ_COUNT_RECURSIVE

        # The index is expected to be built lazily
        assert dataset._index is None

        # Extremely unlikely that there will be a collision in 50 UUIDs
        assert not dataset.has_duplicate()
        assert dataset._index is not None
        assert dataset.num_reads == len(dataset._index)

        observed_count = 0
        for path in dataset.paths:
            reader = dataset.get_reader(path)

            for read_id in reader.read_ids:
                observed_count += 1
                read_record = dataset.get_read(read_id=read_id)
                assert read_record is not None
                # Compare as strings so the check holds whether the ids are
                # exposed as str or UUID
                assert str(read_record.read_id) == str(read_id)
                assert isinstance(read_record, ReadRecord)

        assert observed_count == len(dataset)

    def test_get_reader_is_cached(self, nested_dataset: Path) -> None:
        """Tests that a reader is cached"""
        dataset = p5.DatasetReader(nested_dataset)
        root_path = nested_dataset / "root_10.pod5"
        reader = dataset.get_reader(root_path)
        reader_clone = dataset.get_reader(root_path)
        assert id(reader) == id(reader_clone)
        assert isinstance(reader, p5.Reader)
        assert reader.path == root_path

        cache_info = dataset._get_reader.cache_info()  # type: ignore[attr-defined]
        assert cache_info.hits == 1

    def test_reader_all_cache(self, nested_dataset: Path) -> None:
        """Tests that readers are cached and do not leak handles on close"""
        REPEATS = 5000
        with assert_no_leaked_handles():
            ds = p5.DatasetReader(
                nested_dataset, recursive=True, max_cached_readers=None
            )
            paths = ds.paths
            list(ds.get_reader(p) for p in paths * REPEATS)
            cache_info = ds._get_reader.cache_info()  # type: ignore[attr-defined]
            assert cache_info.maxsize is None
            assert cache_info.currsize == len(ds.paths)
            assert cache_info.misses == len(ds.paths)
            assert cache_info.hits == (REPEATS - 1) * len(ds.paths)
            # Explicitly drop the dataset so its readers are released before the
            # leak check runs
            del ds

        for p in paths:
            assert_no_leaked_handles_win(p)

    def test_reader_all_cache_context(self, nested_dataset: Path) -> None:
        """
        Tests that readers are cached and do not leak handles when the dataset
        is used as a context manager
        """
        REPEATS = 5000
        with assert_no_leaked_handles():
            with p5.DatasetReader(
                nested_dataset, recursive=True, max_cached_readers=None
            ) as ds:
                paths = ds.paths
                list(ds.get_reader(p) for p in paths * REPEATS)
                cache_info = ds._get_reader.cache_info()  # type: ignore[attr-defined]
                assert cache_info.maxsize is None
                assert cache_info.currsize == len(ds.paths)
                assert cache_info.misses == len(ds.paths)
                assert cache_info.hits == (REPEATS - 1) * len(ds.paths)

        for p in paths:
            assert_no_leaked_handles_win(p)

    def test_reader_no_cache(self, nested_dataset: Path) -> None:
        """Tests that no reader cache is used if set"""
        REPEATS = 500
        with assert_no_leaked_handles():
            ds = p5.DatasetReader(nested_dataset, recursive=True, max_cached_readers=0)
            paths = ds.paths
            for p in paths * REPEATS:
                ds.get_reader(p)
            cache_info = ds._get_reader.cache_info()  # type: ignore[attr-defined]
            assert cache_info.maxsize == 0
            assert cache_info.currsize == 0
            assert cache_info.misses == REPEATS * len(ds.paths)
            assert cache_info.hits == 0

            # No call to del here tests that no handles are kept open in the ds

        for p in paths:
            assert_no_leaked_handles_win(p)

    def test_reader_clear_readers(self, nested_dataset: Path) -> None:
        """Tests that the reader cache is cleared without leaking handles"""
        REPEATS = 500
        with assert_no_leaked_handles():
            ds = p5.DatasetReader(
                nested_dataset, recursive=True, max_cached_readers=None
            )
            list(ds.get_reader(p) for p in ds.paths * REPEATS)
            cache_info_before = ds._get_reader.cache_info()  # type: ignore[attr-defined]
            assert cache_info_before.currsize > 0
            ds.clear_readers()
            cache_info_after = ds._get_reader.cache_info()  # type: ignore[attr-defined]
            assert cache_info_after.currsize == 0

            # No call to del here tests that no handles are kept open in the ds

        for p in ds.paths:
            assert_no_leaked_handles_win(p)

    def test_reader_cache_delete(self, nested_dataset: Path) -> None:
        """
        Tests that a cache of size one keeps a single reader, and that deleting
        the caller's reference does not evict that reader from the cache
        """
        with assert_no_leaked_handles():
            with p5.DatasetReader(
                nested_dataset, recursive=True, max_cached_readers=1
            ) as ds:
                list(ds.get_reader(p) for p in ds.paths)
                cache_info_before = ds._get_reader.cache_info()  # type: ignore[attr-defined]
                assert cache_info_before.currsize == 1
                reader = ds.get_reader(ds.paths[0])
                reader_id = id(reader)
                del reader
                assert reader_id == id(ds.get_reader(ds.paths[0]))

                paths = ds.paths

        for p in paths:
            assert_no_leaked_handles_win(p)

    def test_random_read_indexing(self, nested_dataset: Path) -> None:
        """Test randomly selecting by read id"""
        dataset = p5.DatasetReader(nested_dataset, recursive=True)

        observed_count = 0
        for read_id in sorted(dataset.read_ids):
            observed_count += 1
            read_record = dataset.get_read(read_id)
            assert read_record is not None
            assert str(read_record.read_id) == read_id

        assert observed_count == len(dataset) == EXPECT_READ_COUNT_RECURSIVE

        # Invalid read ids are reported as missing rather than raising
        assert dataset.get_read("") is None
        assert dataset.get_read("foo") is None

    def test_duplicate_read_selection(self, nested_dataset: Path) -> None:
        """Test explicitly selecting a read multiple times"""
        dataset = p5.DatasetReader(nested_dataset, recursive=True)
        all_read_ids = list(dataset.read_ids)
        assert len(all_read_ids) > 0
        read_id = random.choice(all_read_ids)

        selection = [read_id, read_id, read_id]

        loaded_reads = list(dataset.reads(selection=selection))
        assert len(loaded_reads) == len(selection)

        for read in loaded_reads:
            assert str(read.read_id) == read_id
            assert np.array_equal(read.signal, loaded_reads[0].signal)

    def test_missing_id_does_not_return_member(self, nested_dataset: Path) -> None:
        """
        Test that a valid read_id (uuid4) which is not in the dataset doesn't return
        a previously loaded member of the dataset
        """
        dataset = p5.DatasetReader(nested_dataset, recursive=True)
        all_read_ids = list(dataset.read_ids)
        assert len(all_read_ids) > 0

        for _ in range(1_000):
            member_ids = set(random.sample(all_read_ids, len(all_read_ids) // 5))
            assert len(member_ids) > 0

            # Create a read id which is not in the dataset. The ids handled here
            # are strings, so the membership checks must use the string form:
            # a UUID object never compares equal to a str.
            missing_id = str(uuid4())
            assert missing_id not in member_ids, "statistically impossible"
            # Add the missing (but valid) read id to the selection
            selection = list(member_ids)
            selection.append(missing_id)

            # Assert only the member read_ids are loaded
            loaded_reads = list(dataset.reads(selection=selection))
            loaded_ids = set(str(read.read_id) for read in loaded_reads)
            assert missing_id not in loaded_ids
            assert loaded_ids == member_ids

    def test_invalid_id_does_not_return_member(self, nested_dataset: Path) -> None:
        """
        Test that invalid selections after valid ones do not return a previous
        valid read
        """
        dataset = p5.DatasetReader(nested_dataset, recursive=True)
        all_read_ids = list(dataset.read_ids)
        assert len(all_read_ids) > 0

        for _ in range(100):
            valid_ids = set(random.sample(all_read_ids, len(all_read_ids) // 5))

            # An empty string is not a valid read id
            selection = list(valid_ids)
            selection.append("")

            loaded_reads = list(dataset.reads(selection=selection))
            loaded_ids = list(str(read.read_id) for read in loaded_reads)
            assert len(loaded_ids) == len(valid_ids)
            assert set(loaded_ids) == valid_ids

    def test_empty_read_selection(self, nested_dataset: Path) -> None:
        """Test empty selection returns no reads"""
        dataset = p5.DatasetReader(nested_dataset, recursive=True)
        loaded_reads = list(dataset.reads(selection=[]))
        assert len(loaded_reads) == 0

    def test_prompt_read_indexing(self, nested_dataset: Path) -> None:
        """Test prompt indexing (index=True builds the index on construction)"""
        with p5.DatasetReader(nested_dataset, recursive=True, index=True) as ds:
            assert ds._index is not None
            assert len(ds._index) == EXPECT_READ_COUNT_RECURSIVE
            assert set(ds._index.keys()) == set(ds.read_ids)

    def test_iter_multi(self, nested_dataset: Path) -> None:
        """Test __iter__ yields all records"""
        dataset = p5.DatasetReader(nested_dataset, recursive=True)

        observed_count = 0
        for read_record in dataset:
            observed_count += 1

            assert read_record is not None
            assert str(read_record.read_id)

        assert observed_count == len(dataset) == EXPECT_READ_COUNT_RECURSIVE

    def test_iter_multi_single_thread(self, nested_dataset: Path) -> None:
        """
        Test reads() yields selected records while threads is one (no multi-threading)
        """
        dataset = p5.DatasetReader(nested_dataset, recursive=True, threads=1)

        expected_count = int(len(dataset) // 1.4)
        sample = random.sample(list(dataset.read_ids), expected_count)

        observed_count = 0
        observed_read_ids = set()
        for read_record in dataset.reads(selection=sample):
            observed_count += 1
            observed_read_ids.add(str(read_record.read_id))

        assert observed_count == expected_count == len(observed_read_ids)
        assert observed_read_ids == set(sample)

    def test_iter_multi_multi_thread(self, nested_dataset: Path) -> None:
        """Test reads() yields selected records using multi-threading"""
        dataset = p5.DatasetReader(nested_dataset, recursive=True, threads=4)

        expected_count = int(len(dataset) // 1.3)
        sample = random.sample(list(dataset.read_ids), expected_count)

        observed_count = 0
        observed_read_ids = set()
        for read_record in dataset.reads(selection=sample):
            observed_count += 1
            observed_read_ids.add(str(read_record.read_id))

        assert observed_count == expected_count == len(observed_read_ids)
        assert observed_read_ids == set(sample)

    def test_iter_multi_multi_thread_no_cache(self, nested_dataset: Path) -> None:
        """
        Test reads() yields selected records from multiple files while
        multi-threading without caching readers
        """
        dataset = p5.DatasetReader(
            nested_dataset, recursive=True, threads=4, max_cached_readers=0
        )

        expected_count = int(len(dataset) // 1.5)
        sample = random.sample(list(dataset.read_ids), expected_count)

        observed_count = 0
        observed_read_ids = set()
        for read_record in dataset.reads(selection=sample):
            observed_count += 1
            observed_read_ids.add(str(read_record.read_id))

        assert observed_count == expected_count == len(observed_read_ids)
        assert observed_read_ids == set(sample)

    def test_mixed_load(self, nested_dataset: Path) -> None:
        """Test passing file and directory paths; repeated inputs are de-duplicated"""
        dataset = p5.DatasetReader(
            [nested_dataset, nested_dataset, POD5_PATH, POD5_PATH], recursive=True
        )
        assert len(dataset) == EXPECT_READ_COUNT_RECURSIVE + 10
        assert len(dataset.paths) == EXPECT_FILE_COUNT_RECURSIVE + 1

    def test_iter_selection(self, nested_dataset: Path) -> None:
        """Test read_id selection"""
        dataset = p5.DatasetReader([nested_dataset], recursive=True)

        sample_size = 20
        read_ids = set(random.sample(list(dataset.read_ids), sample_size))
        observed_count = 0
        for read_record in dataset.reads(selection=read_ids):
            observed_count += 1
            assert str(read_record.read_id) in read_ids

        assert observed_count == sample_size

    def test_iter_duplicate(self, nested_dataset: Path) -> None:
        """Selecting duplicate read_ids yields multiple copies"""
        dataset = p5.DatasetReader([nested_dataset], recursive=True)

        sample_size = 5
        multiplier = 2
        duplicated_read_ids = (
            random.sample(list(dataset.read_ids), sample_size) * multiplier
        )
        observed_count = 0
        for read_record in dataset.reads(selection=duplicated_read_ids):
            observed_count += 1
            assert str(read_record.read_id) in set(duplicated_read_ids)

        assert observed_count == sample_size * multiplier

    def test_duplicate(self, tmp_path: Path) -> None:
        """Selecting from duplicate files yields each copy"""
        pod5_copy = tmp_path / "copy.pod5"
        shutil.copyfile(POD5_PATH, pod5_copy)
        dataset = p5.DatasetReader([POD5_PATH, pod5_copy])

        assert dataset.has_duplicate()

        unique_ids = set(dataset.read_ids)
        observed_count = 0
        for read_record in dataset.reads(selection=unique_ids):
            observed_count += 1
            assert str(read_record.read_id) in unique_ids
        # Each read id exists once in the original and once in the copy
        assert observed_count == len(unique_ids) * 2

    def test_duplicate_index_warns(self, tmp_path: Path) -> None:
        """Indexing from duplicate files warns of consequences and can be suppressed"""
        pod5_copy = tmp_path / "copy.pod5"
        shutil.copyfile(POD5_PATH, pod5_copy)
        dataset = p5.DatasetReader([POD5_PATH, pod5_copy])

        assert dataset.has_duplicate()
        with pytest.warns(Warning, match="read_ids found in dataset"):
            dataset.get_path(next(dataset.read_ids))

        with pytest.warns(Warning, match="read_ids found in dataset"):
            dataset.get_read(next(dataset.read_ids))

        dataset.warn_duplicate_indexing = False
        with warnings.catch_warnings():
            # Escalate warnings to errors so any remaining warning fails the test
            warnings.simplefilter("error")
            dataset.get_path(next(dataset.read_ids))
            dataset.get_read(next(dataset.read_ids))

    def test_iter_missing(self, nested_dataset: Path) -> None:
        """Missing read_ids are not found"""
        dataset = p5.DatasetReader([nested_dataset], recursive=True)

        sample_size = 5
        read_ids = random.sample(list(dataset.read_ids), sample_size)
        missing_ids = [str(uuid4()) for _ in range(50)]

        observed_count = 0
        for read_record in dataset.reads(selection=read_ids + missing_ids):
            observed_count += 1
            assert str(read_record.read_id) in set(read_ids)

        assert observed_count == sample_size

    def test_get_path(self, nested_dataset: Path) -> None:
        """Get the path to underlying file from read_id"""
        dataset = p5.DatasetReader([nested_dataset], recursive=True)

        # A read id which is not in the dataset has no record
        assert dataset.get_read(str(uuid4())) is None

        for path in dataset.paths:
            read_id = dataset.get_reader(path).read_ids[0]
            assert dataset.get_path(read_id) == path

    def test_collect_paths(self, nested_dataset: Path) -> None:
        """Pass various inputs to DatasetReader._collect_dataset"""
        collect = p5.DatasetReader._collect_dataset

        expected = {nested_dataset / "root_10.pod5"}
        kwargs = dict(recursive=False, pattern="*.pod5", threads=1)
        # Both Path and str inputs are accepted
        assert expected == collect(nested_dataset, **kwargs)  # type: ignore
        assert expected == collect(str(nested_dataset), **kwargs)  # type: ignore

        with pytest.raises(TypeError, match="paths must be a Collection"):
            collect(1, **kwargs)  # type: ignore


================================================
FILE: python/pod5/src/tests/test_filter.py
================================================
from pathlib import Path
from random import sample
from typing import List
from uuid import UUID
from pod5.tools.pod5_view import view_pod5

import polars as pl

import pod5 as p5
from pod5.tools.pod5_filter import parse_read_id_targets, filter_pod5
from pod5.tools.pod5_subset import PL_DEST_FNAME, PL_READ_ID

from tests.conftest import skip_if_windows
import pytest


# `test_data` directory, five levels above this test module
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Example pod5 file used as the filter input
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"
# Example read_id list passed to filter_pod5 in the tests below
READ_IDS_PATH = TEST_DATA_PATH / "subset_mapping_examples/read_ids.txt"

# read_ids written to the temporary id files parsed in TestFilterParseIds
EXPECTED_READ_IDS = [
    "0000173c-bf67-44e7-9a9c-1ad0bc728e74",
    "00925f34-6baf-47fc-b40c-22591e27fb5c",
]


class TestFilterParseIds:
    """Test that pod5 filter parses read_id files"""

    def _read_ids_path(self, tmp_path: Path, ids: List[str]) -> Path:
        """Write `ids` one per line to a file under `tmp_path` and return its path"""
        target = tmp_path / "read_ids.txt"
        target.write_text("\n".join(ids))
        return target

    def _assert_columns(self, df: pl.LazyFrame) -> None:
        """Assert the parsed frame has the read_id and destination columns"""
        column_names = df.collect_schema().names()
        for required in (PL_READ_ID, PL_DEST_FNAME):
            assert required in column_names

    def _assert_all_expected(self, df: pl.LazyFrame) -> None:
        """Assert the parsed frame holds exactly the expected read_ids"""
        parsed = df.select(PL_READ_ID).collect().to_series().to_list()
        assert len(parsed) > 0
        assert len(parsed) == len(EXPECTED_READ_IDS)
        assert set(parsed) == set(EXPECTED_READ_IDS)

    def test_example(self, tmp_path: Path) -> None:
        """Parse a file containing only read_ids"""
        path = self._read_ids_path(tmp_path, EXPECTED_READ_IDS)
        assert len(path.read_text().splitlines()) == 2

        parsed = parse_read_id_targets(path, Path.cwd())
        self._assert_columns(parsed)
        self._assert_all_expected(parsed)

    def test_example_with_header(self, tmp_path: Path) -> None:
        """Parse a file with a `read_id` header line"""
        content = ["read_id", *EXPECTED_READ_IDS]
        path = self._read_ids_path(tmp_path, content)
        assert len(path.read_text().splitlines()) == 3

        parsed = parse_read_id_targets(path, Path.cwd())
        self._assert_columns(parsed)
        self._assert_all_expected(parsed)

    def test_example_with_comments(self, tmp_path: Path) -> None:
        """Parse a file with a header and `#` comment lines"""
        content = [
            "read_id",
            "#",
            "# A comment read_id",
            *EXPECTED_READ_IDS,
            "# Comment",
        ]
        path = self._read_ids_path(tmp_path, content)
        assert len(path.read_text().splitlines()) == 6

        parsed = parse_read_id_targets(path, Path.cwd())
        self._assert_columns(parsed)
        self._assert_all_expected(parsed)

    def test_example_with_whitespace(self, tmp_path: Path) -> None:
        """Parse a file with a header, comments and whitespace-only lines"""
        content = [
            "read_id",
            "#",
            "# A comment read_id",
            " ",
            *EXPECTED_READ_IDS,
            "# Comment",
            " ",
        ]
        path = self._read_ids_path(tmp_path, content)
        assert len(path.read_text().splitlines()) == 8

        parsed = parse_read_id_targets(path, Path.cwd())
        self._assert_columns(parsed)
        self._assert_all_expected(parsed)

    def test_no_ids(self, tmp_path: Path) -> None:
        """A file with only a header and comments is rejected"""
        content = ["read_id", "#", "# A comment read_id"]
        path = self._read_ids_path(tmp_path, content)
        assert len(path.read_text().splitlines()) == 3

        with pytest.raises(AssertionError, match="Found 0 read_ids"):
            parse_read_id_targets(path, Path.cwd())


class TestFilter:
    """Test the pod5 filter tool end to end"""

    def test_all_in_out(self, tmp_path: Path) -> None:
        """Filter on every read_id of a pod5 file and expect all of them in the output"""
        with p5.Reader(POD5_PATH) as reader:
            all_ids = reader.read_ids

        output = tmp_path / "output.pod5"
        read_ids = tmp_path / "read_ids.txt"
        read_ids.write_text("\n".join(all_ids))

        assert len(all_ids) > 0
        lazy_targets = parse_read_id_targets(read_ids, output)
        assert isinstance(lazy_targets, pl.LazyFrame)
        targets = lazy_targets.collect()
        assert len(targets) == len(all_ids) == 10
        assert set(targets.get_column(PL_READ_ID)) == set(all_ids)

        options = dict(missing_ok=False, force_overwrite=False, recursive=False)
        filter_pod5([POD5_PATH], output, read_ids, **options)

        assert output.is_file()
        with p5.Reader(output) as reader:
            assert all_ids == reader.read_ids
            assert set(reader.read_ids) == set(targets.get_column(PL_READ_ID))
            assert reader.num_reads > 0

    def test_no_duplicates(self, tmp_path: Path) -> None:
        """Repeat a read_id in the input and check it is written only once"""
        with p5.Reader(POD5_PATH) as reader:
            first_id = reader.read_ids[0]

        output = tmp_path / "output.pod5"
        read_ids = tmp_path / "read_ids.txt"
        read_ids.write_text("\n".join([first_id, first_id]))

        lazy_targets = parse_read_id_targets(read_ids, output)
        assert isinstance(lazy_targets, pl.LazyFrame)
        targets = lazy_targets.collect()
        assert len(targets) == 1
        assert set(targets.get_column(PL_READ_ID)) == {first_id}

        options = dict(missing_ok=False, force_overwrite=False, recursive=False)
        filter_pod5([POD5_PATH], output, read_ids, **options)

        assert output.is_file()
        with p5.Reader(output) as reader:
            assert reader.read_ids[0] == first_id
            assert reader.num_reads == 1

    def test_missing_read_ids(self, tmp_path: Path) -> None:
        """Assert that missing read_ids are detected"""
        with p5.Reader(POD5_PATH) as reader:
            all_ids = reader.read_ids

        # Append a read_id which is known to be absent from the input
        absent_id = UUID(bytes=b"0" * 16)
        read_ids = tmp_path / "read_ids.txt"
        read_ids.write_text("\n".join(all_ids) + f"\n{absent_id}\n")

        output = tmp_path / "output.pod5"

        # Without missing_ok the absent id is an error and nothing is written
        with pytest.raises(RuntimeError):
            filter_pod5(
                [POD5_PATH],
                output,
                read_ids,
                missing_ok=False,
                force_overwrite=False,
                recursive=False,
            )
        assert not output.exists()

        # With missing_ok the absent id is tolerated
        filter_pod5(
            [POD5_PATH],
            output,
            read_ids,
            missing_ok=True,
            force_overwrite=False,
            recursive=False,
        )
        assert output.exists()

    def test_force_overwrite(self, tmp_path: Path) -> None:
        """Assert we cannot overwrite outputs without force"""
        output = tmp_path / "output.pod5"
        output.touch()

        with pytest.raises(FileExistsError, match="--force-overwrite not set"):
            filter_pod5(
                [POD5_PATH],
                output,
                READ_IDS_PATH,
                missing_ok=False,
                force_overwrite=False,
                recursive=False,
            )
        assert output.exists()

        filter_pod5(
            [POD5_PATH],
            output,
            READ_IDS_PATH,
            missing_ok=False,
            force_overwrite=True,
            recursive=False,
        )
        assert output.exists()
        with p5.Reader(output) as reader:
            assert reader.num_reads

    def test_empty_input_fails(self, tmp_path: Path) -> None:
        """Requesting zero reads (an empty id file) raises"""
        empty_file = tmp_path / "empty.txt"
        empty_file.touch()
        output = tmp_path / "output.pod5"

        options = dict(missing_ok=False, force_overwrite=False, recursive=False)
        with pytest.raises(pl.NoDataError, match="empty CSV"):
            filter_pod5([POD5_PATH], output, empty_file, **options)

    @pytest.mark.parametrize("n_reads", [10, 50])
    def test_random_inputs(self, pod5_factory, tmp_path: Path, n_reads: int) -> None:
        """Filter a random sample of read_ids out of several generated pod5 files"""
        pod5s = [pod5_factory(count) for count in (25, 50, 100)]

        # Dump every read_id of the inputs, one per line
        view_tsv = tmp_path / "view.tsv"
        view_pod5(
            pod5s, view_tsv, include="read_id", no_header=True, force_overwrite=True
        )

        candidates = list(set(view_tsv.read_text().splitlines()))
        read_ids = sample(candidates, k=n_reads)
        filter_path = tmp_path / "filter.txt"
        filter_path.write_text("\n".join(read_ids))

        output = tmp_path / "output.pod5"
        filter_pod5(
            pod5s,
            output,
            ids=filter_path,
            missing_ok=False,
            force_overwrite=False,
            recursive=False,
        )

        with p5.Reader(output) as reader:
            assert len(reader.read_ids) == n_reads

    def test_input_directory(self, tmp_path: Path) -> None:
        """Take inputs from directory"""
        output = tmp_path / "output.pod5"
        copy_of = tmp_path / "input.pod5"
        copy_of.write_bytes(POD5_PATH.read_bytes())

        options = dict(missing_ok=False, force_overwrite=False, recursive=False)
        filter_pod5([tmp_path], output, READ_IDS_PATH, **options)

        assert output.exists()
        with p5.Reader(output) as reader:
            assert reader.num_reads

    @skip_if_windows
    def test_recursive_inputs_symlink(self, tmp_path: Path) -> None:
        """Take inputs from a symlink found by a recursive directory search"""
        output = tmp_path / "output.pod5"

        subdir = tmp_path / "one/two"
        subdir.mkdir(parents=True)
        subdir_symlink = subdir / "input.pod5"
        subdir_symlink.symlink_to(POD5_PATH)

        options = dict(missing_ok=False, force_overwrite=False, recursive=True)
        filter_pod5([tmp_path], output, READ_IDS_PATH, **options)

        assert output.exists()
        with p5.Reader(output) as reader:
            assert reader.num_reads


================================================
FILE: python/pod5/src/tests/test_inspect.py
================================================
from pathlib import Path
import pytest

from pod5.tools.pod5_inspect import inspect_pod5


# `test_data` directory, five levels above this test module
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Example pod5 file inside the test data directory
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"


class TestReads:
    """Test the `reads` command of pod5 inspect"""

    def test_reads_header_written_once(
        self, capsys: pytest.CaptureFixture, pod5_factory
    ) -> None:
        """Inspecting several files prints a single header line followed by all reads"""
        read_counts = (10, 25)
        paths = [pod5_factory(count) for count in read_counts]

        inspect_pod5("reads", paths)

        captured = capsys.readouterr()
        lines = str(captured.out).splitlines()

        # One header line plus one line per read
        assert len(lines) == 1 + 10 + 25
        header_lines = [line for line in lines if "read_id" in line]
        assert len(header_lines) == 1


================================================
FILE: python/pod5/src/tests/test_merge.py
================================================
from pathlib import Path

import pytest

import pod5 as p5
from pod5.tools.pod5_merge import merge_pod5

# `test_data` directory, five levels above this test module
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"


class TestMerge:
    """Test merge application"""

    def test_merge_runs(self, tmp_path: Path):
        """Test that the merge tool runs a trivial example"""
        # Merge only the first two of the `split_*` pod5 files in the test data
        candidates = list(TEST_DATA_PATH.glob("split_*pod5"))
        output = tmp_path / "test.pod5"

        merge_pod5(
            candidates[:2],
            output,
            force_overwrite=False,
            recursive=False,
        )
        assert output.exists()

        # The merged file must contain at least one read
        with p5.Reader(output) as reader:
            merged_reads = list(reader.reads())
        assert merged_reads

    def test_merge_duplicate_stopped(self, tmp_path: Path):
        """Test that the merge tool prevents duplicate reads being merged"""
        # Use every pod5 file in the test data, which is expected to contain
        # duplicate read ids across files
        every_pod5 = list(TEST_DATA_PATH.glob("*pod5"))
        output = tmp_path / "test.pod5"

        with pytest.raises(RuntimeError, match="Duplicate read id"):
            merge_pod5(every_pod5, output)


================================================
FILE: python/pod5/src/tests/test_reader.py
================================================
"""
Testing Pod5Reader
"""

import random
from pathlib import Path
from typing import Type
from unittest import mock
from uuid import UUID, uuid4

import lib_pod5 as p5b
import numpy
import numpy.typing
import packaging
import pyarrow as pa
import pytest

import pod5 as p5
from pod5.api_utils import format_read_ids
from pod5.pod5_types import Calibration, EndReason, RunInfo
from pod5.reader import ArrowTableHandle, ReadRecordBatch, SignalRowInfo
from tests.conftest import POD5_PATH


class TestPod5Reader:
    """Test the Pod5Reader from a pod5 file"""

    def test_reader_fixture(self, reader: p5.Reader) -> None:
        """Basic assertions on the reader fixture"""
        assert isinstance(reader, p5.Reader)
        assert isinstance(reader.batch_count, int)
        assert reader.is_vbz_compressed is True
        assert reader.batch_count > 0

    @pytest.mark.parametrize(
        "attribute,expected_type",
        [
            ("calibration", Calibration),
            ("calibration_digitisation", int),
            ("calibration_range", float),
            ("end_reason", EndReason),
            ("read_id", UUID),
            ("read_number", int),
            ("start_sample", int),
            ("median_before", float),
            ("run_info", RunInfo),
            ("num_minknow_events", int),
            ("num_reads_since_mux_change", int),
            ("num_samples", int),
        ],
    )
    def test_reader_reads_types(
        self, reader: p5.Reader, attribute: str, expected_type: Type
    ) -> None:
        """Assert the types returned for reads are consistent with expectations"""
        minimum_reads = 5
        for pod5_read in reader.reads():
            assert isinstance(pod5_read, p5.ReadRecord)
            assert isinstance(getattr(pod5_read, attribute), expected_type)
            minimum_reads -= 1
            if minimum_reads <= 0:
                break
        else:
            # Only reached when the reads ran out before the loop could break
            assert False, "did not test minimum reads!"

    @pytest.mark.parametrize(
        "attribute,collection_type,dtype",
        [
            ("signal", numpy.ndarray, numpy.int16),
            ("signal_pa", numpy.ndarray, numpy.float32),
        ],
    )
    def test_reader_reads_numpy_types(
        self,
        reader: p5.Reader,
        attribute: str,
        collection_type: Type,
        dtype: numpy.typing.DTypeLike,
    ) -> None:
        """Assert the array type and dtype of the numpy-valued read attributes"""
        minimum_reads = 5
        for pod5_read in reader.reads():
            assert isinstance(pod5_read, p5.ReadRecord)
            collection = getattr(pod5_read, attribute)
            assert isinstance(collection, collection_type)
            assert collection.dtype == dtype

            minimum_reads -= 1
            if minimum_reads <= 0:
                break
        else:
            # Only reached when the reads ran out before the loop could break
            assert False, "did not test minimum reads!"

    @pytest.mark.parametrize(
        "attribute,collection_type,leaf_type",
        [
            ("signal_rows", list, SignalRowInfo),
        ],
    )
    def test_reader_reads_container_types(
        self,
        reader: p5.Reader,
        attribute: str,
        collection_type: Type,
        leaf_type: Type,
    ) -> None:
        """Assert the container type and first/last element type of read attributes"""
        minimum_reads = 5
        for pod5_read in reader.reads():
            assert isinstance(pod5_read, p5.ReadRecord)
            collection = getattr(pod5_read, attribute)
            assert isinstance(collection, collection_type)
            assert isinstance(collection[0], leaf_type)
            assert isinstance(collection[-1], leaf_type)

            minimum_reads -= 1
            if minimum_reads <= 0:
                break
        else:
            # Only reached when the reads ran out before the loop could break
            assert False, "did not test minimum reads!"

    def test_attribute_types(self) -> None:
        """Assert the types of the public attributes of a Reader on POD5_PATH"""
        with p5.Reader(POD5_PATH) as reader:
            assert isinstance(reader.path, Path)
            assert reader.path == POD5_PATH
            assert reader.reads_table_version == 4

            # File handles
            assert isinstance(reader.inner_file_reader, p5b.Pod5FileReader)
            assert isinstance(reader.read_table, pa.ipc.RecordBatchFileReader)
            assert isinstance(reader.run_info_table, pa.ipc.RecordBatchFileReader)
            assert isinstance(reader.signal_table, pa.ipc.RecordBatchFileReader)

            assert isinstance(reader.file_version, packaging.version.Version)
            assert isinstance(
                reader.file_version_pre_migration, packaging.version.Version
            )
            assert isinstance(reader.writing_software, str)
            assert isinstance(reader.file_identifier, UUID)
            assert isinstance(reader.reads_table_version, int)
            assert isinstance(reader.is_vbz_compressed, bool)
            assert isinstance(reader.signal_batch_row_count, int)
            assert isinstance(reader.batch_count, int)
            assert isinstance(reader.num_reads, int)

            assert isinstance(reader.read_ids_raw, pa.ChunkedArray)
            assert isinstance(reader.read_ids, list)
            assert all(isinstance(r, str) for r in reader.read_ids)

            assert isinstance(reader.get_batch(0), ReadRecordBatch)

    def test_without_mmap(self) -> None:
        """Test the file load without mmap for low-memory devices"""
        pod5_file_reader = p5b.open_file(str(POD5_PATH))
        read_table_location = pod5_file_reader.get_file_read_table_location()

        # Make the mmap loader raise OSError. patch.object restores the real
        # attribute on exit, so the override cannot leak into other tests
        # (assigning the mock directly on the class would persist for the
        # rest of the test session).
        with mock.patch.object(
            ArrowTableHandle,
            "_open_reader_with_mmap",
            mock.Mock(side_effect=OSError),
        ):
            ath = ArrowTableHandle(read_table_location)

            # A usable reader must still be available despite the mmap failure
            assert ath.reader is not None
            assert ath.reader.num_record_batches > 0

        # Clean reader resources
        del pod5_file_reader

    def test_sparse_file_warns_during_preflight(self, tmp_path: Path, capfd) -> None:
        """Assert sparse/offloaded-like files emit a preflight warning."""
        sparse_path = tmp_path / "sparse-warning.pod5"
        sparse_size_bytes = 128 * 1024 * 1024
        # Seek past the end and write a single byte so the file has a large
        # st_size while (on most filesystems) allocating very few blocks.
        with sparse_path.open("wb") as sparse_file:
            sparse_file.seek(sparse_size_bytes - 1)
            sparse_file.write(b"\0")

        sparse_stats = sparse_path.stat()
        if not hasattr(sparse_stats, "st_blocks"):
            pytest.skip("filesystem does not expose st_blocks")

        # st_blocks is counted in 512-byte units
        allocated_bytes = sparse_stats.st_blocks * 512
        missing_fraction = 1.0 - (allocated_bytes / sparse_stats.st_size)
        if missing_fraction < 0.8:
            pytest.skip("test file is not sparse enough on this filesystem")

        # The file holds no valid pod5 content, so opening it is expected to fail
        with pytest.raises(RuntimeError):
            p5b.open_file(str(sparse_path))

        captured = capfd.readouterr()
        assert "Warning: POD5 file" in captured.err
        assert "has st_size=" in captured.err
        assert (
            "The file may be sparse or offloaded and open/read operations may fail."
            in captured.err
        )

    def test_iter_selection_in_file_order(self, reader: p5.Reader) -> None:
        """Tests iteration order is on-disk order"""
        # Shuffle a copy: shuffling in place would reorder whatever list the
        # reader handed out, which is also the reference order compared below.
        shuffled = list(reader.read_ids)
        random.shuffle(shuffled)
        observed_count = 0
        for record, read_id in zip(reader.reads(selection=shuffled), reader.read_ids):
            assert str(record.read_id) == read_id
            observed_count += 1
        assert observed_count == len(reader.read_ids)


class TestRecordBatch:
    """Test ReadRecordBatch access through a Reader"""

    def test_get_read(self, pod5_factory) -> None:
        """Reads fetched by index from a batch match the reader's iteration order"""
        n_reads = 10
        path = pod5_factory(n_reads)
        with p5.Reader(path) as reader:
            reads = list(reader.reads())

            assert reader.batch_count == 1
            batch = reader.get_batch(0)
            assert batch.num_reads == n_reads

            # Check the count explicitly rather than via the loop variable,
            # which would be unbound (NameError) if no reads were returned.
            assert len(reads) == n_reads
            for idx, read in enumerate(reads):
                assert read.read_id == batch.get_read(idx).read_id

    def test_column_selection(self, pod5_factory) -> None:
        """Column accessors honour the rows chosen by set_selected_batch_rows"""
        n_reads = 10
        path = pod5_factory(n_reads)
        with p5.Reader(path) as reader:
            batch = reader.get_batch(0)

            # Without a selection the columns cover every read in the batch
            assert len(batch.read_id_column) == n_reads
            assert len(batch.read_number_column) == n_reads

            select_idxs = [3, 4, 8]
            batch.set_selected_batch_rows(select_idxs)

            assert type(batch.read_id_column) is pa.FixedSizeBinaryArray
            assert len(batch.read_id_column) == len(select_idxs)
            ids = [reader.read_ids[idx] for idx in select_idxs]
            assert format_read_ids(batch.read_id_column) == ids

            assert type(batch.read_number_column) is pa.UInt32Array
            assert len(batch.read_number_column) == len(select_idxs)
            reads = list(reader.reads())
            rnums = [reads[idx].read_number for idx in select_idxs]

            assert batch.read_number_column.to_numpy().tolist() == rnums

    def test_read_batches(self, pod5_factory) -> None:
        """read_batches yields the expected number of batches for 1100 reads"""
        n_reads = 1100
        path = pod5_factory(n_reads)
        with p5.Reader(path) as reader:
            rrb = reader.read_batches
            assert len(list(rrb())) == 2
            assert len(list(rrb(batch_selection=[0]))) == 1
            assert len(list(rrb(batch_selection=[0, 1]))) == 2

    def test_read_batches_raises(self, pod5_factory) -> None:
        """read_batches rejects conflicting arguments and unknown read ids"""
        n_reads = 1100
        path = pod5_factory(n_reads)
        with p5.Reader(path) as reader:
            first, last = reader.read_ids[0], reader.read_ids[-1]
            with pytest.raises(ValueError, match="mutually exclusive"):
                list(reader.read_batches(selection=[first, last], batch_selection=[0]))

            # A freshly generated uuid is not expected to be in the file
            with pytest.raises(RuntimeError, match="Failed to find"):
                list(reader.read_batches(selection=[str(uuid4())]))

    def test_cache_exceptions(self, pod5_factory) -> None:
        """Cached signal columns raise when no signal cache has been set"""
        n_reads = 10
        path = pod5_factory(n_reads)
        with p5.Reader(path) as reader:
            batch = reader.get_batch(0)

            # No cache set: merely accessing the attribute must raise
            with pytest.raises(RuntimeError, match="No cached signal data available"):
                batch.cached_sample_count_column
            with pytest.raises(RuntimeError, match="No cached signal data available"):
                batch.cached_samples_column


================================================
FILE: python/pod5/src/tests/test_recover.py
================================================
import sys
from os.path import exists
from pathlib import Path

import numpy as np

import pytest

import pod5 as p5
from pod5.tools.pod5_recover import recover_pod5

from tests.conftest import _random_read

# Shared "test_data" directory, located five directory levels above this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"


class TestRecover:
    """Test recover application"""

    def _generate_recoverable_file(self, dest_path: Path, read_count=1200):
        """
        Write `read_count` random reads to `dest_path` and leave the file
        unclosed, returning the list of reads that were added.
        """
        with p5.Writer(dest_path) as writer:
            written = [_random_read() for _ in range(read_count)]
            for read in written:
                writer.add_read(read)

            # Hold a reference to the inner writer on the test instance so that
            # close is not called on it ...
            self._tmp_file_ref = writer._writer
            # ... and detach it from the p5.Writer so the context exit cannot
            # close it either.
            writer._writer = None

        # The destination and exactly one of each temporary file must remain
        assert dest_path.exists()
        for tmp_pattern in (".*.tmp-run-info", ".*.tmp-reads"):
            assert len(list(dest_path.parent.glob(tmp_pattern))) == 1
        return written

    @pytest.mark.parametrize("cleanup", [False, True])
    def test_recover_runs(
        self, capsys: pytest.CaptureFixture, tmp_path: Path, cleanup: bool
    ):
        """Test that the recover tool runs a trivial example"""

        recoverable_path = tmp_path / "recoverable.tmp"
        added_reads = self._generate_recoverable_file(recoverable_path)

        # The unfinished file cannot be opened directly
        with pytest.raises(RuntimeError):
            p5.Reader(recoverable_path)

        recover_pod5(
            [recoverable_path], recursive=False, force_overwrite=False, cleanup=cleanup
        )

        recovered_name = recoverable_path.stem + "_recovered.pod5"
        expected_recovered_path = recoverable_path.parent / recovered_name

        with p5.Reader(expected_recovered_path) as reader:
            recovered_pairs = list(zip(reader.reads(), added_reads))
            for read_record, expected_read in recovered_pairs:
                assert read_record.read_id == expected_read.read_id
                assert read_record.end_reason == expected_read.end_reason
                assert read_record.pore == expected_read.pore
                assert read_record.run_info == expected_read.run_info
                assert np.array_equal(read_record.signal, expected_read.signal)

            # Only recover in whole batches, so whole 1000 read counts
            whole_batches = len(added_reads) // 1000
            assert len(recovered_pairs) == whole_batches * 1000

        if sys.platform != "win32":
            # The input survives exactly when cleanup was not requested
            assert exists(recoverable_path) != cleanup
            return

        # Cleanup errors are expected on Windows, because we are still holding input file handles.
        assert exists(recoverable_path)
        if cleanup:
            capture_result = capsys.readouterr()
            assert (
                "remove: The process cannot access the file because it is being used by another process."
                in capture_result.out
            )


================================================
FILE: python/pod5/src/tests/test_repack.py
================================================
from pathlib import Path
import random
from uuid import uuid4
import numpy as np

import pod5 as p5
from pod5.repack import Repacker
from pod5.tools.pod5_repack import repack_pod5
from tests.conftest import skip_if_windows
import pytest


# Shared "test_data" directory, located five directory levels above this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Input pod5 file copied or symlinked by the repack tests below
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"


class TestRepack:
    """Test that pod5 repack runs"""

    @staticmethod
    def _stage_input(tmp_path: Path) -> Path:
        """Copy POD5_PATH to a new `subdir/test.pod5` under `tmp_path` and return it"""
        staged = tmp_path / "subdir/test.pod5"
        staged.parent.mkdir(exist_ok=False, parents=True)
        staged.write_bytes(POD5_PATH.read_bytes())
        return staged

    def test_works(self, tmp_path: Path) -> None:
        """Repacking a directory recursively writes an equivalent file to the output"""
        data = self._stage_input(tmp_path)

        output = tmp_path / "output"
        repacked = output / "test.pod5"
        assert not repacked.exists()
        repack_pod5(
            [tmp_path], output, threads=2, force_overwrite=False, recursive=True
        )
        assert output.is_dir()
        assert repacked.is_file()

        # Compare source and destination reads pairwise
        with p5.Reader(repacked) as dest, p5.Reader(data) as source:
            for d_read, s_read in zip(dest, source):
                assert d_read.read_id == s_read.read_id
                assert d_read.pore == s_read.pore
                assert d_read.calibration == s_read.calibration
                assert np.array_equal(d_read.signal, s_read.signal)

    def test_detect_name_collision(self, tmp_path: Path) -> None:
        """Two inputs sharing a filename in different directories are rejected"""
        self._stage_input(tmp_path)

        # Second input with the same filename, one directory level up
        (tmp_path / "test.pod5").touch()

        output = tmp_path / "output"
        with pytest.raises(ValueError, match="same filename"):
            repack_pod5(
                [tmp_path], output, threads=2, force_overwrite=False, recursive=True
            )

    @skip_if_windows
    def test_overwrite_symlink(self, tmp_path: Path) -> None:
        """An existing destination is only replaced when force_overwrite is set"""
        subdir = tmp_path / "subdir"
        subdir.mkdir(exist_ok=False, parents=True)
        (subdir / "test.pod5").symlink_to(POD5_PATH)

        dest = tmp_path / "test.pod5"
        dest.touch()

        # Without force_overwrite the pre-existing destination blocks the repack
        with pytest.raises(FileExistsError, match="Refusing to overwrite"):
            repack_pod5(
                [subdir],
                tmp_path,
                threads=2,
                force_overwrite=False,
                recursive=True,
            )

        repack_pod5(
            [subdir],
            tmp_path,
            threads=2,
            force_overwrite=True,
            recursive=True,
        )

        assert dest.is_file()
        with p5.Reader(dest) as reader:
            assert reader.read_ids

    def test_overwrite_data(self, tmp_path: Path) -> None:
        """With force_overwrite an existing empty destination is replaced by real data"""
        self._stage_input(tmp_path)

        dest = tmp_path / "test.pod5"
        dest.touch()

        repack_pod5(
            [tmp_path / "subdir"],
            tmp_path,
            threads=2,
            force_overwrite=True,
            recursive=True,
        )

        assert dest.is_file()
        with p5.Reader(dest) as reader:
            assert reader.read_ids


class TestRepacker:
    """Test the Repacker API directly"""

    def test_add_all(self, tmp_path: Path, pod5_factory) -> None:
        """Copying every read of a 10-read file is reflected in the counters"""
        source_path = pod5_factory(10)
        repacker = Repacker()

        with p5.Writer(tmp_path / "dest.pod5") as writer:
            output = repacker.add_output(writer, check_duplicate_read_ids=True)

            # Nothing requested yet, and the output is not marked finished,
            # so the repacker is not complete
            assert repacker.reads_requested == 0
            assert repacker.reads_completed == 0
            assert not repacker.is_complete

            with p5.Reader(source_path) as reader:
                repacker.add_all_reads_to_output(output, reader)
            repacker.set_output_finished(output)
            repacker.finish()

            assert repacker.reads_requested == 10
            assert repacker.reads_completed == 10
            assert repacker.is_complete

    def test_add_selection(self, tmp_path: Path, pod5_factory) -> None:
        """Copying a random selection of 50 reads yields exactly those reads"""
        source_path = pod5_factory(1100)
        dest = tmp_path / "dest.pod5"
        repacker = Repacker()

        with p5.Writer(dest) as writer:
            output = repacker.add_output(writer)

            with p5.Reader(source_path) as reader:
                selection = set(random.sample(reader.read_ids, 50))
                repacker.add_selected_reads_to_output(output, reader, selection)

            repacker.set_output_finished(output)
            repacker.finish()

            expected_count = len(selection)
            assert repacker.reads_requested == expected_count
            assert repacker.reads_completed == expected_count
            assert repacker.is_complete

        # The destination must contain the selected read ids and nothing else
        with p5.Reader(dest) as confirm:
            assert set(confirm.read_ids) == set(selection)

        # finish is called a second time after the writer has been closed
        repacker.finish()

    def test_missing_selection(self, tmp_path: Path, pod5_factory) -> None:
        """Selecting a read id that is not in the source raises"""
        source_path = pod5_factory(10)
        repacker = Repacker()

        with p5.Writer(tmp_path / "dest.pod5") as writer:
            output = repacker.add_output(writer)

            with p5.Reader(source_path) as reader:
                # A freshly generated uuid is not expected to be in the source
                selection = {str(uuid4())}
                with pytest.raises(RuntimeError, match="Failed to find"):
                    repacker.add_selected_reads_to_output(output, reader, selection)

            repacker.set_output_finished(output)
            repacker.finish()


================================================
FILE: python/pod5/src/tests/test_signal_tools.py
================================================
"""
Testing signal_tools
"""

from io import TextIOWrapper
from pathlib import Path
import random

import numpy as np
import numpy.typing as npt
from pod5.api_utils import safe_close
import pytest

from pod5.signal_tools import (
    vbz_compress_signal,
    vbz_compress_signal_chunked,
    vbz_decompress_signal,
    vbz_decompress_signal_chunked,
)

# Values passed (indirectly) to the `random_signal` fixture by the parametrized tests
TEST_SEEDS = range(10)


class TestPod5SignalTools:
    """Test the POD5 signal_tools module"""

    @pytest.mark.parametrize("random_signal", TEST_SEEDS, indirect=True)
    def test_round_trip(self, random_signal: npt.NDArray[np.int16]) -> None:
        """Compressing then decompressing a random signal returns the original"""
        compressed = vbz_compress_signal(random_signal)
        restored = vbz_decompress_signal(compressed, random_signal.shape[0])
        assert np.array_equal(restored, random_signal)

    def test_round_trip_empty(self) -> None:
        """Compressing then decompressing an empty signal returns an empty signal"""
        empty_signal = np.array([], dtype=np.int16)
        compressed = vbz_compress_signal(empty_signal)
        restored = vbz_decompress_signal(compressed, empty_signal.shape[0])
        assert np.array_equal(restored, empty_signal)

    @pytest.mark.parametrize("random_signal", TEST_SEEDS, indirect=True)
    def test_round_trip_chunked(self, random_signal: npt.NDArray[np.int16]) -> None:
        """Chunked compression and decompression of a random signal round-trips"""
        chunk_size = random.randint(1, 1000)
        chunks, chunk_lengths = vbz_compress_signal_chunked(random_signal, chunk_size)

        # One length per compressed chunk, together covering every sample
        assert len(chunks) == len(chunk_lengths)
        assert random_signal.shape[0] == sum(chunk_lengths)

        restored = vbz_decompress_signal_chunked(chunks, chunk_lengths)
        assert np.array_equal(restored, random_signal)

    def test_round_trip_chunked_empty(self) -> None:
        """Chunked compression and decompression of an empty signal round-trips"""
        empty_signal = np.array([], dtype=np.int16)
        chunk_size = random.randint(1, 1000)
        chunks, chunk_lengths = vbz_compress_signal_chunked(empty_signal, chunk_size)

        # One length per compressed chunk, together covering every sample
        assert len(chunks) == len(chunk_lengths)
        assert empty_signal.shape[0] == sum(chunk_lengths)

        restored = vbz_decompress_signal_chunked(chunks, chunk_lengths)
        assert np.array_equal(restored, empty_signal)


class DemoObj:
    """Small object owning an open text file handle, used to exercise safe_close"""

    def __init__(self, path: Path) -> None:
        # `other` is an ordinary string attribute; `handle` is a text handle
        # opened for reading on `path`
        self.other: str = "other"
        self.handle: TextIOWrapper = path.open("r")

    def __del__(self):
        # Release the handle when the object is destroyed
        safe_close(self, "handle")


@pytest.fixture
def demo_obj(tmp_path: Path) -> DemoObj:
    """Provide a DemoObj whose handle is open on an empty file in `tmp_path`"""
    example_file = tmp_path / "example.txt"
    example_file.touch()
    return DemoObj(example_file)


class TestSafeClose:
    """Test the safe_close utility"""

    def test_closes(self, demo_obj: DemoObj) -> None:
        """An open file handle attribute is closed by safe_close"""
        handle = demo_obj.handle
        assert not handle.closed
        safe_close(demo_obj, "handle")
        assert demo_obj.handle.closed

    def test_passes_unknown_attribute(self, demo_obj: DemoObj) -> None:
        """Attribute names that do not exist on the object do not raise"""
        for missing_name in ("not_an_attr", ""):
            safe_close(demo_obj, missing_name)

    def test_passes_known_non_handle_attribute(self, demo_obj: DemoObj) -> None:
        """An existing attribute that is not a handle is left unchanged"""
        assert demo_obj.other == "other"
        safe_close(demo_obj, "other")
        assert demo_obj.other == "other"


================================================
FILE: python/pod5/src/tests/test_subset.py
================================================
import subprocess
import sys
from pathlib import Path
from types import ModuleType
from typing import Dict, List, Set

import lib_pod5 as p5b
import polars as pl
import pytest
from polars.testing import assert_frame_equal, assert_series_equal

import pod5
from pod5.tools.pod5_inspect import inspect_pod5
from pod5.tools.pod5_subset import (
    PL_DEST_FNAME,
    PL_READ_ID,
    assert_filename_template,
    build_targets_dict,
    column_keys_from_template,
    create_default_filename_template,
    fstring_to_polars,
    get_separator,
    parse_csv_mapping,
    parse_table_mapping,
    subset_pod5,
)


def get_resource_module() -> ModuleType | None:
    # resource module only available in posix platforms
    # This module is used to set the resource limits when testing subset's
    # file handle / resource management
    try:
        import resource

        return resource
    except ModuleNotFoundError:
        return None


# True only when the `resource` module imported and exposes RLIMIT_NOFILE;
# hasattr(None, ...) is False, so this is False when the import failed.
HAS_RLIMIT = hasattr(get_resource_module(), "RLIMIT_NOFILE")

CSV_RESULT_1 = {
    "repeated_name": {"r1", "r2"},
    "multi_read": {"r1", "r2", "r3"},
    "handle_spaces": {"r2", "r3", "r5"},
}

# Output filename -> read ids expected in that output; no read id is shared
MAPPING = {
    "well-2.pod5": {
        "002fde30-9e23-4125-9eae-d112c18a81a7",
    },
    "well-4.pod5": {
        "00919556-e519-4960-8aa5-c2dfa020980c",
        "0000173c-bf67-44e7-9a9c-1ad0bc728e74",
        "00925f34-6baf-47fc-b40c-22591e27fb5c",
    },
}

# As MAPPING, but read id 00925f34-... appears in both outputs
MAPPING_REPEATED = {
    "well-2.pod5": {
        "002fde30-9e23-4125-9eae-d112c18a81a7",
        "00925f34-6baf-47fc-b40c-22591e27fb5c",
    },
    "well-4.pod5": {
        "00919556-e519-4960-8aa5-c2dfa020980c",
        "0000173c-bf67-44e7-9a9c-1ad0bc728e74",
        "00925f34-6baf-47fc-b40c-22591e27fb5c",
    },
}

# NOTE(review): the values below are set literals, so the repeated entries
# collapse when the module is loaded and this compares equal to
# MAPPING_REPEATED. A list per output would be needed to really carry
# duplicate read ids - confirm the intent.
MAPPING_DUPLICATED = {
    "well-2.pod5": {
        "002fde30-9e23-4125-9eae-d112c18a81a7",
        "002fde30-9e23-4125-9eae-d112c18a81a7",
        "002fde30-9e23-4125-9eae-d112c18a81a7",
        "00925f34-6baf-47fc-b40c-22591e27fb5c",
    },
    "well-4.pod5": {
        "00919556-e519-4960-8aa5-c2dfa020980c",
        "0000173c-bf67-44e7-9a9c-1ad0bc728e74",
        "00925f34-6baf-47fc-b40c-22591e27fb5c",
        "00925f34-6baf-47fc-b40c-22591e27fb5c",
    },
}

# Shared "test_data" directory, located five directory levels above this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Input pod5 file that the subset tests read from
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"


class TestSubset:
    """Test that pod5 subset subsets files"""

    @staticmethod
    def csv_mapping_single(path: Path, mapping: Dict[str, Set[str]]) -> Path:
        """
        Write `mapping` to `path / "csv.csv"` with one "<target>,<read_id>" line
        per read id (read ids are exploded over many lines) and return the csv
        path. Targets are written as paths inside `path`.
        """
        output = path / "csv.csv"
        with output.open("w") as _fh:
            for target, read_ids in mapping.items():
                for read_id in read_ids:
                    _fh.write(f"{path / target},{read_id}\n")
        return output

    def _test_subset(self, tmp: Path, csv: Path, mapping: Dict[str, Set[str]]) -> None:
        """
        Subset POD5_PATH into `tmp` using the targets parsed from `csv`, then
        assert the output files and their read ids match `mapping`.
        """
        targets = parse_csv_mapping(csv)
        targets_dict = build_targets_dict(targets)

        p5b.subset_pod5s_with_mapping(
            [POD5_PATH],
            tmp,
            targets_dict,
            # threads=threads,
            False,
            False,
            False,
        )

        # Assert only the expected files are output
        expected_outnames = list(mapping.keys())
        actual_outnames = list(path.name for path in tmp.glob("*.pod5"))
        assert sorted(expected_outnames) == sorted(actual_outnames)

        # Check all read_ids are present in their respective files
        for outname in expected_outnames:
            with pod5.Reader(tmp / outname) as reader:
                assert reader.read_ids
                # Set here asserts that there are no duplicates in output
                assert sorted(reader.read_ids) == sorted(set(mapping[outname]))

    def test_subset_base(self, tmp_path: Path):
        """Test a known-good basic use case"""
        csv = self.csv_mapping_single(tmp_path, MAPPING)
        self._test_subset(tmp_path, csv, MAPPING)

    def test_subset_shared_read_id(self, tmp_path: Path):
        """Test subsample with a mapping with shared reads_ids in outputs"""
        csv = self.csv_mapping_single(tmp_path, MAPPING_REPEATED)
        self._test_subset(tmp_path, csv, MAPPING_REPEATED)

    def test_subset_duplicate_read_id(self, tmp_path: Path):
        """Test subsample with a mapping with shared reads_ids in outputs"""
        # NOTE(review): this is currently identical to
        # test_subset_shared_read_id. The name suggests it was meant to feed
        # duplicated read ids within a single output - confirm the intent
        # before changing the input.
        csv = self.csv_mapping_single(tmp_path, MAPPING_REPEATED)
        self._test_subset(tmp_path, csv, MAPPING_REPEATED)

    def test_subset_dir_and_recurse(
        self, tmp_path: Path, capsys: pytest.CaptureFixture
    ) -> None:
        """Subset a recursively searched directory using an inspect table"""
        csv = tmp_path / "csv.csv"
        data = tmp_path / "subdir/test.pod5"
        data.parent.mkdir(exist_ok=False, parents=True)
        data.write_bytes(POD5_PATH.read_bytes())

        # Capture the stdout of `inspect reads` and use it as the subset table
        inspect_pod5("reads", [POD5_PATH])
        captured_stdout = str(capsys.readouterr().out)
        with csv.open("w") as csv_write:
            csv_write.writelines(captured_stdout)

        output = tmp_path / "output_dir"
        subset_pod5(
            [tmp_path],
            output=output,
            csv=None,
            table=csv,
            columns=["well"],
            threads=2,
            template="",
            read_id_column="read_id",
            missing_ok=False,
            ignore_incomplete_template=False,
            force_overwrite=False,
            recursive=True,
        )
        assert output.exists()
        for output_pod5 in output.glob("*.pod5"):
            with pod5.Reader(output_pod5) as reader:
                assert reader.read_ids

    def test_assert_overwrite(self, tmp_path: Path) -> None:
        """Test that subsetting raises when an output file already exists"""

        # Create a file we know will be written to in `test_subset_base`:
        (tmp_path / "well-2.pod5").touch()

        # Run the test, expecting an error
        with pytest.raises(RuntimeError):
            self.test_subset_base(tmp_path)

    def _pod5s_with_view_table(
        self, num_input_pod5s: int, tmp_path: Path, pod5_factory
    ) -> tuple[Path, Path]:
        """
        Create cached pod5s and the view table

        Calls `pod5_factory(n)` for every n from 1 to `num_input_pod5s`
        inclusive, so exactly `num_input_pod5s` files are requested, then
        writes a `pod5 view` table for the directory holding them to
        `tmp_path / "view.table"`.

        Returns the pod5 directory and the table path.
        Raises ValueError if `num_input_pod5s` is less than 1.
        """
        if num_input_pod5s < 1:
            raise ValueError("num_input_pod5s must be at least 1")

        print(f"Creating {num_input_pod5s} pod5s for tests")
        # The upper bound is inclusive: stopping at `num_input_pod5s` would
        # create one file fewer than requested.
        for n in range(1, num_input_pod5s + 1):
            pod5_path = Path(pod5_factory(n))
        print(f"Finished creating {num_input_pod5s} pod5s for tests")

        # assumes pod5_factory places every file in the same directory, so the
        # parent of the last file holds all inputs - TODO confirm
        pod5_dir = pod5_path.parent

        # Run pod5 view to create the view table
        from pod5.tools.pod5_view import view_pod5

        table = tmp_path / "view.table"
        view_pod5(
            inputs=[pod5_dir],
            output=table,
            recursive=True,
        )

        return pod5_dir, table

    @pytest.mark.skipif(not HAS_RLIMIT, reason="POSIX only")
    def test_subset_ulimit_below_num_outputs(
        self, tmp_path: Path, capsys: pytest.CaptureFixture, pod5_factory
    ):
        """Subset succeeds when the open-file limit is capped at a third of the read count"""
        resource = get_resource_module()
        assert resource is not None

        num_input_pod5s = 50
        pod5_dir, table = self._pod5s_with_view_table(
            num_input_pod5s, tmp_path, pod5_factory
        )
        # File n is requested with n reads, so the total is the triangular number
        num_reads = sum(range(num_input_pod5s + 1))  # T(50)=1275

        output = tmp_path / "output_dir"
        cmd = [
            sys.executable,
            "-m",
            "pod5.tools.main",
            "subset",
            "--table",
            str(table),
            "--columns",
            "channel",  # assuming channel * mux is mostly unique
            "mux",
            "--output",
            str(output),
            "--recursive",
            "--force-overwrite",
            str(pod5_dir),
        ]

        def set_nofile_le_num_outputs():
            # Set ulimit below max number of output handles.
            # Using (num_reads // 3) as channel * mux should be unique per read
            soft, hard = resource.getrlimit(resource.RLIMIT_NOFILE)
            rlimit_soft, rlimit_hard = min(num_reads // 3, soft), hard
            resource.setrlimit(resource.RLIMIT_NOFILE, (rlimit_soft, rlimit_hard))

        # preexec_fn applies the limit in the child process only
        r = subprocess.run(
            cmd,
            preexec_fn=set_nofile_le_num_outputs,
            capture_output=True,
            text=True,
            check=False,
        )

        assert r.returncode == 0, r.stderr

    @pytest.mark.skipif(not HAS_RLIMIT, reason="POSIX only")
    def test_subset_ulimit_below_num_inputs(
        self, tmp_path: Path, capsys: pytest.CaptureFixture, pod5_factory
    ):
        """Subset succeeds when the open-file limit is below the number of input files"""
        resource = get_resource_module()
        assert resource is not None

        num_input_pod5s = 50
        pod5_dir, table = self._pod5s_with_view_table(
            num_input_pod5s, tmp_path, pod5_factory
        )

        output = tmp_path / "output_dir"
        cmd = [
            sys.executable,
            "-m",
            "pod5.tools.main",
            "subset",
            "--table",
            str(table),
            "--columns",
            "mux",
            "--output",
            str(output),
            "--recursive",
            "--force-overwrite",
            str(pod5_dir),
        ]

        def set_nofile_le_num_inputs():
            # Set ulimit below max number of input handles.
            soft, hard = resource.getrlimit(resource.RLIMIT_NOFILE)
            rlimit_soft, rlimit_hard = min(num_input_pod5s - 4, soft), hard
            resource.setrlimit(resource.RLIMIT_NOFILE, (rlimit_soft, rlimit_hard))

        # preexec_fn applies the limit in the child process only
        r = subprocess.run(
            cmd,
            preexec_fn=set_nofile_le_num_inputs,
            capture_output=True,
            text=True,
            check=False,
        )

        assert r.returncode == 0, r.stderr


class TestFilenameTemplating:
    """Checks for building and parsing output filename templates"""

    @pytest.mark.parametrize(
        ("columns", "expected"),
        [
            (["mux"], "mux-{mux}.pod5"),
            (["mux", "channel"], "mux-{mux}_channel-{channel}.pod5"),
            (["channel", "mux"], "channel-{channel}_mux-{mux}.pod5"),
        ],
    )
    def test_default_template(self, columns: List[str], expected: str):
        """The default template for `columns` equals the expected string"""
        assert create_default_filename_template(columns) == expected

    @pytest.mark.parametrize(
        ("keys", "template"),
        [
            (["mux"], "mux-{mux}.pod5"),
            (["mux", "channel"], "mux-{mux}_channel-{channel}.pod5"),
            (["channel", "mux"], "channel-{channel}_mux-{mux}.pod5"),
            (["aa", "bb", "aa"], "{aa}_{bb}_{aa}.pod5"),
            (["cc", "cc", "cc"], "!{cc}.{cc}.{cc}"),
            (["cc"], "{{{cc}}}"),
            ([], "{{{}}}"),
            ([], ""),
            ([], "foo.pod5"),
        ],
    )
    def test_column_keys_from_template(self, keys: List[str], template: str) -> None:
        """Keys are extracted in order of appearance, repeats included"""
        extracted = column_keys_from_template(template)
        assert keys == extracted

    @pytest.mark.parametrize(
        ("keys", "pl_template", "template"),
        [
            (["mux"], "mux-{}.pod5", "mux-{mux}.pod5"),
            (["mux", "ch"], "mux-{}_ch-{}.pod5", "mux-{mux}_ch-{ch}.pod5"),
            (["ch", "mux"], "ch-{}_mux-{}.pod5", "ch-{ch}_mux-{mux}.pod5"),
            (["aa", "bb", "aa"], "{}_{}_{}.pod5", "{aa}_{bb}_{aa}.pod5"),
            (["cc", "cc", "cc"], "!{}.{}.{}", "!{cc}.{cc}.{cc}"),
            (["cc"], "{{{}}}", "{{{cc}}}"),
            ([], "{{{}}}", "{{{}}}"),
            ([], "", ""),
            ([], "foo.pod5", "foo.pod5"),
        ],
    )
    def test_fstring_to_polars(
        self, keys: List[str], pl_template: str, template: str
    ) -> None:
        """The named template converts to a positional template plus its keys"""
        actual_pl, actual_keys = fstring_to_polars(template)
        assert actual_pl == pl_template
        assert actual_keys == keys

    def test_template_assertions(self) -> None:
        """assert_filename_template raises KeyError for unusable templates"""
        # A key that is not an available column is always rejected
        for bad_template in ("some_{unknown}.pod5", "some_{unknown}_{known}.pod5"):
            with pytest.raises(KeyError):
                assert_filename_template(bad_template, ["known"], True)

        # A template that omits a column passes only when the last flag is True
        assert_filename_template("some.pod5", ["known"], True)
        with pytest.raises(KeyError):
            assert_filename_template("some.pod5", ["known"], False)


class TestParse:
    """Test separator detection and the csv / table mapping parsers"""

    def test_csv_separator(self, tmp_path: Path) -> None:
        """A comma-delimited file reports "," as its separator"""
        csv = tmp_path / "csv.csv"
        # writelines() adds no line endings, so every row carries its own
        with csv.open("w") as writer:
            writer.writelines(["this,is,a,csv,line\n", "some,other,line\n"])
        assert "," == get_separator(csv)

    def test_tsv_separator(self, tmp_path: Path) -> None:
        """A tab-delimited file reports a tab as its separator"""
        tsv = tmp_path / "tsv.tsv"
        # writelines() adds no line endings, so every row carries its own
        with tsv.open("w") as writer:
            writer.writelines(["this\tis\ta\ttab\tline\n", "some\tother\tline\n"])
        assert "\t" == get_separator(tsv)

    def _inspect_reads_content(
        self, paths: List[Path], capsys: pytest.CaptureFixture
    ) -> str:
        """Run `inspect_pod5("reads", paths)` and return the captured stdout"""
        inspect_pod5("reads", paths)
        return str(capsys.readouterr().out)

    def _write_csv(self, tmp_path: Path, content: str) -> Path:
        """Write `content` unchanged to tmp_path/table.csv and return the path"""
        csv_path = tmp_path / "table.csv"
        with csv_path.open("w") as csv:
            csv.write(content)
        return csv_path

    def _write_tsv(self, tmp_path: Path, content: str) -> Path:
        """Write `content` with commas swapped for tabs to tmp_path/table.tsv"""
        tsv_path = tmp_path / "table.tsv"
        with tsv_path.open("w") as tsv:
            tsv.write(content.replace(",", "\t"))
        return tsv_path

    def _parse_csv_and_tsv(
        self, tmp_path: Path, capsys: pytest.CaptureFixture, columns: List[str]
    ):
        """
        Dump the reads of POD5_PATH as csv and tsv tables and parse both with
        parse_table_mapping. Returns the (csv, tsv) results uncollected.
        """
        content = self._inspect_reads_content([POD5_PATH], capsys)
        csv = self._write_csv(tmp_path=tmp_path, content=content)
        tsv = self._write_tsv(tmp_path=tmp_path, content=content)
        return (
            parse_table_mapping(csv, None, columns),
            parse_table_mapping(tsv, None, columns),
        )

    def _assert_frames_match(self, csv_df, tsv_df) -> None:
        """Both collected frames are non-empty and equal row for row"""
        assert len(csv_df) > 0
        assert len(csv_df) == len(tsv_df)
        assert all(c == t for c, t in zip(csv_df.rows(), tsv_df.rows()))
        assert_frame_equal(csv_df, tsv_df)

    def _assert_mapping(self, parsed, mapping: dict) -> None:
        """
        Compare the destination filename and read id columns of `parsed`
        against `mapping` ({filename: [read ids]}), ignoring row order.
        """
        records = [[fname, rids] for fname, rids in mapping.items()]
        expected = (
            pl.from_records(records, schema=[PL_DEST_FNAME, PL_READ_ID], orient="row")
            .explode(PL_READ_ID)
            .with_columns(pl.col(PL_DEST_FNAME).cast(pl.Categorical))
        )

        # Each column is sorted independently before comparison
        for column in (PL_DEST_FNAME, PL_READ_ID):
            assert_series_equal(
                expected.get_column(column).sort(),
                parsed.get_column(column).sort(),
            )

    def test_csv_tsv_parse_equal_1(
        self, tmp_path: Path, capsys: pytest.CaptureFixture
    ) -> None:
        """csv and tsv tables parse identically when mapping by channel"""
        csv_ldf, tsv_ldf = self._parse_csv_and_tsv(tmp_path, capsys, ["channel"])

        assert isinstance(csv_ldf, pl.LazyFrame)
        assert isinstance(tsv_ldf, pl.LazyFrame)

        csv_channel = csv_ldf.collect()
        tsv_channel = tsv_ldf.collect()
        self._assert_frames_match(csv_channel, tsv_channel)

        assert "channel" in csv_channel.columns
        assert PL_READ_ID in csv_channel.columns
        assert PL_DEST_FNAME in csv_channel.columns

        expected_mapping = {
            "channel-109.pod5": ["0000173c-bf67-44e7-9a9c-1ad0bc728e74"],
            "channel-126.pod5": ["007cc97e-6de2-4ff6-a0fd-1c1eca816425"],
            "channel-147.pod5": ["00728efb-2120-4224-87d8-580fbb0bd4b2"],
            "channel-199.pod5": ["00919556-e519-4960-8aa5-c2dfa020980c"],
            "channel-2.pod5": ["008468c3-e477-46c4-a6e2-7d021a4ebf0b"],
            "channel-452.pod5": ["009dc9bd-c5f4-487b-ba4c-b9ce7e3a711e"],
            "channel-463.pod5": ["002fde30-9e23-4125-9eae-d112c18a81a7"],
            "channel-474.pod5": ["008ed3dc-86c2-452f-b107-6877a473d177"],
            "channel-489.pod5": ["006d1319-2877-4b34-85df-34de7250a47b"],
            "channel-53.pod5": ["00925f34-6baf-47fc-b40c-22591e27fb5c"],
        }
        self._assert_mapping(csv_channel, expected_mapping)

    def test_csv_tsv_parse_equal_2(
        self, tmp_path: Path, capsys: pytest.CaptureFixture
    ) -> None:
        """csv and tsv tables parse identically when mapping by well and end_reason"""
        csv_ldf, tsv_ldf = self._parse_csv_and_tsv(
            tmp_path, capsys, ["well", "end_reason"]
        )
        csv_df = csv_ldf.collect()
        tsv_df = tsv_ldf.collect()
        self._assert_frames_match(csv_df, tsv_df)

        assert "well" in csv_df.columns
        assert "end_reason" in csv_df.columns

        expected_mapping = {
            "well-2_end_reason-unknown.pod5": [
                "002fde30-9e23-4125-9eae-d112c18a81a7",
                "009dc9bd-c5f4-487b-ba4c-b9ce7e3a711e",
                "008468c3-e477-46c4-a6e2-7d021a4ebf0b",
                "00728efb-2120-4224-87d8-580fbb0bd4b2",
                "007cc97e-6de2-4ff6-a0fd-1c1eca816425",
            ],
            "well-4_end_reason-unknown.pod5": [
                "00919556-e519-4960-8aa5-c2dfa020980c",
                "0000173c-bf67-44e7-9a9c-1ad0bc728e74",
                "008ed3dc-86c2-452f-b107-6877a473d177",
                "006d1319-2877-4b34-85df-34de7250a47b",
                "00925f34-6baf-47fc-b40c-22591e27fb5c",
            ],
        }
        self._assert_mapping(csv_df, expected_mapping)

    def test_parse_csv_filters_invalid_read_ids(self, tmp_path: Path) -> None:
        """parse_csv_mapping keeps the UUID row and drops the non-UUID row"""
        csv = tmp_path / "invalid.csv"
        valid_id = "00000000-0000-0000-0000-000000000000"
        invalid_id = "not-a-uuid"
        with csv.open("w") as writer:
            writer.write(f"{tmp_path / 'valid.pod5'},{valid_id}\n")
            writer.write(f"{tmp_path / 'invalid.pod5'},{invalid_id}\n")

        parsed = parse_csv_mapping(csv).collect()

        assert parsed.height == 1
        assert parsed.get_column(PL_READ_ID).to_list() == [valid_id]
        assert parsed.get_column(PL_DEST_FNAME).to_list() == [
            str(tmp_path / "valid.pod5")
        ]

    def test_parse_table_filters_invalid_read_ids(self, tmp_path: Path) -> None:
        """parse_table_mapping keeps the UUID row and drops the non-UUID row"""
        table = tmp_path / "table.csv"
        valid_id = "11111111-1111-1111-1111-111111111111"
        invalid_id = "1234"
        with table.open("w") as writer:
            writer.writelines(
                [
                    "sample,read_id\n",
                    f"A,{valid_id}\n",
                    f"B,{invalid_id}\n",
                ]
            )

        parsed = parse_table_mapping(table, None, ["sample"]).collect()

        assert parsed.height == 1
        assert parsed.get_column(PL_READ_ID).to_list() == [valid_id]
        assert parsed.get_column(PL_DEST_FNAME).to_list() == ["sample-A.pod5"]


================================================
FILE: python/pod5/src/tests/test_tools.py
================================================
"""
Testing Pod5 Tools
"""

import argparse
import os
from pathlib import Path
import subprocess
import sys
from typing import Callable, Dict
from unittest.mock import Mock, patch
from uuid import UUID

import h5py
import numpy as np
from pod5.tools.utils import collect_inputs, limit_threads
import pytest
import vbz_h5py_plugin  # noqa: F401

import pod5
from pod5.tools import main, parsers

# `test_data` directory located five directory levels above this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Example fast5 / pod5 inputs fed to the command tests below
FAST5_PATH = TEST_DATA_PATH / "multi_fast5_zip.fast5"
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"
# Mapping csv given to `pod5 subset --csv`
SUBSET_CSV_PATH = TEST_DATA_PATH / "subset_mapping_examples/subset.csv"
# Read id list given to `pod5 filter --ids`
READ_IDS_PATH = TEST_DATA_PATH / "subset_mapping_examples/read_ids.txt"


def assert_exit_code(func: Callable, func_kwargs: Dict, exit_code: int = 0) -> None:
    """
    Assert that calling ``func(**func_kwargs)`` ends with the given exit code.

    A ``SystemExit`` raised by ``func`` supplies the observed code, with a code
    of ``None`` counted as 0. Returning normally also counts as 0, so a call
    that never exits can no longer satisfy an expected non-zero code.

    Raises:
        AssertionError: if the observed code differs from ``exit_code``.
    """
    try:
        func(**func_kwargs)
    except SystemExit as exc:
        observed = 0 if exc.code is None else exc.code
    else:
        # No SystemExit at all is treated as a successful exit
        observed = 0

    assert observed == exit_code, f"expected exit code {exit_code}, got {observed!r}"


class TestPod5Tools:
    """Test the Pod5 tools interface"""

    @staticmethod
    def _run_cli(argv: list) -> None:
        """Call main.main() while argparse sees `argv` as the process arguments"""
        with patch("argparse._sys.argv", argv):
            main.main()

    @staticmethod
    def _assert_help_exits_cleanly(*words: str) -> None:
        """`pod5 <words...> --help` must finish with exit code 0"""
        with patch("argparse._sys.argv", ["pod5", *words, "--help"]):
            assert_exit_code(main.main, {}, 0)

    @staticmethod
    def _raising_parser(message: str) -> argparse.ArgumentParser:
        """Build a parser whose default `func` raises Exception(message)"""

        def _func() -> None:
            raise Exception(message)

        parser = argparse.ArgumentParser()
        parser.set_defaults(func=_func)
        return parser

    @patch("pod5.tools.main.run_tool")
    def test_main_calls_run(self, m_run_tool: Mock) -> None:
        """Assert that main calls run_tool and hands its result back"""
        m_run_tool.return_value = "_return_value"
        result = main.main()
        m_run_tool.assert_called()
        assert result == "_return_value"

    def test_run_tool_debug_env(
        self, capsys: pytest.CaptureFixture, monkeypatch: pytest.MonkeyPatch
    ) -> None:
        """Assert that exceptions are printed nicely without POD5_DEBUG"""
        dummy_error_string = "Dummy Error String"
        parser = self._raising_parser(dummy_error_string)

        # Intentionally raise an error
        with monkeypatch.context() as mkp:
            mkp.setenv("POD5_DEBUG", "0")
            mkp.setattr("argparse._sys.argv", ["_raises_an_exception"])
            assert_exit_code(parsers.run_tool, {"parser": parser}, 1)

        error_str: str = capsys.readouterr().err
        for fragment in ("POD5_DEBUG=1", dummy_error_string):
            assert fragment in error_str

    def test_run_tool_raises(self, monkeypatch: pytest.MonkeyPatch) -> None:
        """Assert that exceptions are raised if POD5_DEBUG is set"""
        dummy_error_string = "Dummy Error String"
        parser = self._raising_parser(dummy_error_string)

        # Intentionally raise an error
        with monkeypatch.context() as mkp:
            mkp.setenv("POD5_DEBUG", "1")
            mkp.setattr("argparse._sys.argv", ["_raises_an_exception"])

            with pytest.raises(Exception, match=dummy_error_string):
                parsers.run_tool(parser)

    def test_pod5_version_argument(self, capsys: pytest.CaptureFixture) -> None:
        """Assert that pod5 has a --version argument"""
        with patch("argparse._sys.argv", ["pod5", "--version"]):
            assert_exit_code(main.main, {}, 0)

        printed = capsys.readouterr().out.lower()
        assert f"pod5 version: {pod5.__version__}" in printed

    @pytest.mark.parametrize("subcommand", ["fast5", "to_fast5", "from_fast5"])
    def test_convert_exists(self, subcommand: str) -> None:
        """Assert that pod5 convert exists"""
        self._assert_help_exits_cleanly("convert", subcommand)

    @pytest.mark.parametrize("subcommand", ["summary", "read", "reads", "debug"])
    def test_inspect_exists(self, subcommand: str) -> None:
        """Assert that pod5 inspect exists"""
        self._assert_help_exits_cleanly("inspect", subcommand)

    @pytest.mark.parametrize(
        "command",
        ["convert", "inspect", "filter", "merge", "subset", "repack", "update"],
    )
    def test_tool_exists(self, command: str) -> None:
        """Assert that a pod5 tool exists"""
        self._assert_help_exits_cleanly(command)

    def test_convert_from_fast5_runs(self, tmp_path: Path) -> None:
        """Assert that typical commands are valid"""
        destination = tmp_path / "new.pod5"
        self._run_cli(
            [
                "pod5",
                "convert",
                "from_fast5",
                str(FAST5_PATH),
                "--output",
                str(destination),
                "--strict",
            ]
        )

    def test_convert_to_fast5_runs(self, tmp_path: Path) -> None:
        """Assert that typical commands are valid"""
        outdir = tmp_path / "outdir"
        self._run_cli(
            ["pod5", "convert", "to_fast5", str(POD5_PATH), "--output", str(outdir)]
        )

        assert outdir.exists()
        fast5s = list(outdir.glob("*.fast5"))
        assert len(fast5s) > 0

        # Inspect the first group of the first output file
        prefix = "read_"
        with h5py.File(fast5s[0]) as f5:
            read_id = str(list(f5.keys())[0])
            assert read_id.startswith(prefix)
            assert UUID(read_id[len(prefix) :])
            signal = np.array(f5[read_id]["Raw/Signal"])
            assert len(signal) > 0

    @pytest.mark.parametrize("subcommand", ["summary", "reads"])
    def test_inspect_command_runs(self, tmp_path: Path, subcommand: str) -> None:
        """Assert that typical commands are valid"""
        self._run_cli(["pod5", "inspect", subcommand, str(POD5_PATH)])

    def test_inspect_read_finds_read(self, capsys: pytest.CaptureFixture) -> None:
        """Assert that inspect read finds a known read"""
        known_read_id = "0000173c-bf67-44e7-9a9c-1ad0bc728e74"
        self._run_cli(["pod5", "inspect", "read", str(POD5_PATH), known_read_id])

        stdout_lines = str(capsys.readouterr().out).splitlines()

        # A few expected lines from the tool
        expected_lines = (
            "read_id: 0000173c-bf67-44e7-9a9c-1ad0bc728e74",
            "read_number:\t1093",
            "start_sample:\t4534321",
            "median_before:\t183.1077423095703",
        )
        for expected_line in expected_lines:
            assert expected_line in stdout_lines

    def test_merge_command_runs(self, tmp_path: Path) -> None:
        """Assert that typical commands are valid"""
        destination = tmp_path / "new.pod5"
        self._run_cli(["pod5", "merge", str(POD5_PATH), "--output", str(destination)])

    def test_repack_command_runs(self, tmp_path: Path) -> None:
        """Assert that typical commands are valid"""
        destination = tmp_path / "new.pod5"
        self._run_cli(["pod5", "repack", str(POD5_PATH), "--output", str(destination)])

    def test_recover_command_runs(self) -> None:
        """Assert that typical commands are valid"""
        self._run_cli(["pod5", "recover", str(POD5_PATH)])

    def test_subset_command_runs(self, tmp_path: Path) -> None:
        """Assert that typical commands are valid"""
        output = Path(tmp_path / "test_dir")
        output.mkdir()
        self._run_cli(
            [
                "pod5",
                "subset",
                str(POD5_PATH),
                "--output",
                str(output),
                "--csv",
                str(SUBSET_CSV_PATH),
            ]
        )

        # assert len(list(output.rglob("*pod5"))) == 2

    def test_filter_command_runs(self, tmp_path: Path) -> None:
        """Assert that typical commands are valid"""
        destination = tmp_path / "take.pod5"
        self._run_cli(
            [
                "pod5",
                "filter",
                str(POD5_PATH),
                "--output",
                str(destination),
                "--ids",
                str(READ_IDS_PATH),
            ]
        )

    def test_update_command_runs(self, tmp_path: Path) -> None:
        """Assert that typical commands are valid"""
        self._run_cli(["pod5", "update", str(POD5_PATH), "--output", str(tmp_path)])

    def test_view_command_runs(self) -> None:
        """Assert that typical commands are valid"""
        self._run_cli(["pod5", "view", str(POD5_PATH)])

    def test_view_command_runs_list_fields(self) -> None:
        """Assert that typical commands are valid"""
        self._run_cli(["pod5", "view", "--list-fields"])

    @pytest.mark.skipif(
        sys.platform.startswith("win") and sys.version_info < (3, 8),
        reason="windows py3.7 pathlib concatenation issue",
    )
    @pytest.mark.parametrize(
        "script", list((Path(__file__).parent.parent / "pod5/tools").glob("pod5*.py"))
    )
    def test_scripts_run_directly(self, script: Path) -> None:
        """pod5 tools should run if executed directly as scripts"""
        interpreter = Path(sys.executable)
        command = [interpreter, script.absolute(), "--help"]
        subprocess.check_call(command)


class TestUtils:
    """Tests for collect_inputs and limit_threads"""

    def test_collect_inputs(self, tmp_path: Path) -> None:
        """collect_inputs returns the set of files matching the given pattern(s)"""
        expected = [
            tmp_path / "a.pod5",
            tmp_path / "longer-name.pod5",
            tmp_path / "sub/a.pod5",
            tmp_path / "sub/sub2/xx.pod5",
        ]
        not_expected = [
            tmp_path / ".pod5",  # Exclude hidden files
            tmp_path / "other.txt",
            tmp_path / "pod5.p5",
            tmp_path / "a.pod5.p5",
            tmp_path / "sub/other.png",
            tmp_path / "sub/sub3/bad.pods",
        ]

        # Create every file, including the ones that must not be collected
        for path in expected + not_expected:
            path.parent.mkdir(parents=True, exist_ok=True)
            path.touch()

        assert all(path.exists() for path in expected + not_expected)

        # Expect all pod5s recursively
        recurse = collect_inputs([tmp_path], recursive=True, pattern="*.pod5")
        assert set(expected) == set(tmp_path.rglob("*[a-z0-9].pod5"))
        assert recurse == set(expected)
        assert set(not_expected).isdisjoint(recurse)

        # Expect all pod5s in top level
        top = collect_inputs([tmp_path], recursive=False, pattern="*.pod5")
        assert set(tmp_path.glob("*[a-z0-9].pod5")) == top
        assert set(top).isdisjoint(not_expected)

        # Files aren't duplicated in similar patterns
        dupl = collect_inputs([tmp_path], recursive=False, pattern=["*.pod5", "*d5"])
        assert dupl == top

        # Expect no matches
        assert not collect_inputs([tmp_path], recursive=True, pattern="*.none")

        # Expect file_pattern to find other than *.pod5
        p5_suffix = collect_inputs([tmp_path], recursive=True, pattern="*.p5")
        assert p5_suffix
        assert p5_suffix == {path for path in not_expected if path.suffix == ".p5"}

        expect_mixed = {tmp_path / "other.txt", tmp_path / "sub/other.png"}
        assert expect_mixed == collect_inputs(
            [tmp_path], recursive=True, pattern=["*.txt", "*.png"]
        )

    def test_collect_inputs_non_existent(self, tmp_path: Path) -> None:
        """Test FileExistsError raised if input doesn't exist"""
        with pytest.raises(FileExistsError, match="inputs do not exist"):
            collect_inputs([tmp_path / "non_existent.txt"], False, "*.txt")

    @pytest.mark.skipif(os.cpu_count() is None, reason="os.cpu_count is None")
    def test_limit_threads(self) -> None:
        """Test thread limiting"""
        cpus = os.cpu_count()
        # Already excluded by the skipif above; narrows Optional[int] to int
        assert cpus is not None

        # This test expects requests below one to resolve to the cpu count
        assert limit_threads(-1) == cpus
        assert limit_threads(0) == cpus

        # Requests within the cpu count are returned unchanged
        for i in range(1, cpus + 1):
            assert limit_threads(i) == i

        # Requests above the cpu count are capped
        assert limit_threads(cpus + 1) == cpus
        assert limit_threads(1_000_000) == cpus


================================================
FILE: python/pod5/src/tests/test_update.py
================================================
from pathlib import Path
import packaging.version
import pod5 as p5
from pod5.tools.pod5_update import update_pod5
import pytest


# `test_data` directory located five directory levels above this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
# Example pod5 files; only POD5_V2_PATH is referenced by TestUpdate below
POD5_V1_PATH = TEST_DATA_PATH / "multi_fast5_zip_v1.pod5"
POD5_V2_PATH = TEST_DATA_PATH / "multi_fast5_zip_v2.pod5"
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"


class TestUpdate:
    """Test that pod5 update runs"""

    def test_detect_inplace_update(self, tmp_path: Path) -> None:
        """Using the input directory as the output raises an "in-place" AssertionError"""
        (tmp_path / "my.pod5").touch()

        with pytest.raises(AssertionError, match="in-place"):
            update_pod5([tmp_path], tmp_path, force_overwrite=False, recursive=True)

    def test_update(self, tmp_path: Path) -> None:
        """
        Test update updates files and doesn't overwrite existing files unless forced
        """
        threshold = packaging.version.Version("0.1")

        # Stage a copy of the v2 example file under data/v1.pod5
        source_dir = tmp_path / "data"
        source_dir.mkdir(parents=True)
        staged = source_dir / "v1.pod5"
        staged.write_bytes(POD5_V2_PATH.read_bytes())

        with p5.Reader(staged) as reader:
            assert reader.file_version_pre_migration < threshold

        # Pre-create an empty file where the updated output will be written
        clash = tmp_path / "v1.pod5"
        clash.touch()

        # Test no overwrite
        with pytest.raises(FileExistsError, match="--force-overwrite"):
            update_pod5([source_dir], tmp_path, force_overwrite=False, recursive=True)

        # Forced: the placeholder is replaced by a readable, newer-version file
        update_pod5([source_dir], tmp_path, force_overwrite=True, recursive=True)
        assert clash.is_file()
        with p5.Reader(clash) as reader:
            assert reader.file_version_pre_migration > threshold
            assert reader.read_ids


================================================
FILE: python/pod5/src/tests/test_view.py
================================================
from pathlib import Path
import random
from typing import Any, Dict
import polars as pl

import pytest

import pod5 as p5
from pod5.tools.pod5_view import (
    Field,
    assert_unique_acquisition_id,
    get_included_reads_table_fields,
    get_reads_tables,
    join_reads_to_run_info,
    parse_read_table_chunks,
    parse_reads_table_all,
    parse_run_info_table,
    view_pod5,
    select_fields,
    get_field_or_raise,
    resolve_output,
    write,
    write_header,
    FIELDS,
)


# `test_data` directory located five directory levels above this file
TEST_DATA_PATH = Path(__file__).parent.parent.parent.parent.parent / "test_data"
POD5_PATH = TEST_DATA_PATH / "multi_fast5_zip_v4.pod5"

# Field names in the exact order the tests below expect in the view header,
# also used as the expected full selection of select_fields()
ALL_FIELDS = [
    "read_id",
    "filename",
    "read_number",
    "channel",
    "mux",
    "end_reason",
    "start_time",
    "start_sample",
    "duration",
    "num_samples",
    "minknow_events",
    "sample_rate",
    "median_before",
    "predicted_scaling_scale",
    "predicted_scaling_shift",
    "tracked_scaling_scale",
    "tracked_scaling_shift",
    "num_reads_since_mux_change",
    "time_since_mux_change",
    "run_id",
    "sample_id",
    "experiment_id",
    "flow_cell_id",
    "pore_type",
    "open_pore_level",
]


class TestView:
    """Test view application"""

    def is_equal_or_not_set(self, field: str, expected: str) -> None:
        """Assert `field` equals `expected`, or is "" while `expected` is "not_set" """
        unset_pair = field == "" and expected == "not_set"
        assert field == expected or unset_pair

    def _compare(self, record: p5.ReadRecord, row: Dict[str, Any]) -> None:
        """
        Assert that one row of view output describes the given read record.

        `row` maps field names to values; callers pass either raw text cells
        or values loaded by polars, so each value is converted before comparing.
        Float fields are compared with pytest.approx (NaN matches NaN).
        """

        def approx(value: Any) -> Any:
            # pytest.approx only checks anything when used in an `==` comparison
            return pytest.approx(float(value), nan_ok=True)

        sample_rate = record.run_info.sample_rate

        assert str(record.read_id) == row["read_id"]
        assert record.read_number == int(row["read_number"])
        assert record.pore.well == int(row["mux"])
        assert record.pore.channel == int(row["channel"])
        assert record.end_reason.name == row["end_reason"]
        # Times in the row are sample counts divided by the sample rate
        assert record.start_sample / sample_rate == float(row["start_time"])
        assert record.start_sample == int(row["start_sample"])
        assert record.num_samples / sample_rate == float(row["duration"])
        assert record.num_samples == int(row["num_samples"])
        assert record.num_minknow_events == float(row["minknow_events"])
        assert sample_rate == int(row["sample_rate"])

        assert record.median_before == approx(row["median_before"])
        assert record.predicted_scaling.scale == approx(row["predicted_scaling_scale"])
        assert record.predicted_scaling.shift == approx(row["predicted_scaling_shift"])
        assert record.tracked_scaling.scale == approx(row["tracked_scaling_scale"])
        assert record.tracked_scaling.shift == approx(row["tracked_scaling_shift"])
        assert record.num_reads_since_mux_change == int(
            row["num_reads_since_mux_change"]
        )
        assert record.time_since_mux_change == approx(row["time_since_mux_change"])
        assert record.open_pore_level == approx(row["open_pore_level"])

        assert record.run_info.protocol_run_id == row["run_id"]
        self.is_equal_or_not_set(record.run_info.sample_id, row["sample_id"])
        self.is_equal_or_not_set(record.run_info.experiment_name, row["experiment_id"])
        self.is_equal_or_not_set(record.run_info.flow_cell_id, row["flow_cell_id"])
        assert record.pore.pore_type == row["pore_type"]

    def test_view(self, tmp_path: Path):
        """Test that the view tool writes a header plus one matching row per read"""
        output = tmp_path / "test.tsv"
        view_pod5([POD5_PATH], output)

        assert output.exists()

        with output.open("r") as _fh:
            content = _fh.readlines()

        # 10 lines + 1 header
        assert len(content) == 11

        header = content[0]
        assert list(map(str.strip, header.split("\t"))) == ALL_FIELDS

        with p5.Reader(POD5_PATH) as reader:
            for idx, record in enumerate(reader):
                # Row idx + 1 skips the header line
                items = list(map(str.strip, content[idx + 1].split("\t")))
                row = {name: items[ALL_FIELDS.index(name)] for name in ALL_FIELDS}
                assert POD5_PATH.name == row["filename"]

                self._compare(record, row)

            # All 10 records were visited
            assert idx == 9

    def test_view_no_input(self, tmp_path: Path):
        """Test that view_pod5 raises AssertionError if given a directory with no files"""
        empty_dir = tmp_path
        expected_message = "Found no pod5 files"
        with pytest.raises(AssertionError, match=expected_message):
            view_pod5([empty_dir], empty_dir)

    def test_write_stdout(self, capsys: pytest.CaptureFixture) -> None:
        """Test that polars writes to stdout when path is None"""

        ldf = next(get_reads_tables(POD5_PATH, select_fields()))
        write_header(None, select_fields())
        write(ldf, None)

        # readouterr() drains both streams, so read them from a single call;
        # a second call would always report an empty stderr.
        captured = capsys.readouterr()
        content: str = captured.out
        err: str = captured.err
        assert not err

        lines = content.splitlines()
        header = lines[0]
        assert list(map(str.strip, header.split("\t"))) == ALL_FIELDS
        # 10 lines + 1 header
        assert len(lines) == 11
        # No line is repeated
        assert len(set(lines)) == len(lines)

    def test_is_loadable(self, tmp_path: Path) -> None:
        """Test that the view output loads with polars and matches each read record"""
        output = tmp_path / "test.tsv"
        view_pod5([POD5_PATH], output)

        df = pl.read_csv(output, separator="\t")
        with p5.Reader(POD5_PATH) as reader:
            for idx, record in enumerate(reader):
                row = df.row(idx, named=True)
                assert POD5_PATH.name == row["filename"]

                self._compare(record, row)

    def test_parse_run_info(self, pod5_factory) -> None:
        """Test the run_info table parser"""
        selection = select_fields()
        with p5.Reader(pod5_factory(10)) as reader:
            lazy_info = parse_run_info_table(reader, selection)

        # The parser hands back an uncollected frame
        assert isinstance(lazy_info, pl.LazyFrame)
        info_df = lazy_info.collect()
        assert info_df.is_unique().all()

        schema_names = info_df.collect_schema().names()
        for dropped in ("context_tags", "tracking_id"):
            assert dropped not in schema_names
        # Every selected run_info field is present as a column
        for run_info_field in selection.info_fields:
            assert run_info_field in schema_names

    def test_parse_reads_all(self, pod5_factory) -> None:
        """Test the reads table parser where the file is small enough to do in one go"""
        selection = select_fields()
        a_pod5 = pod5_factory(10)
        with p5.Reader(a_pod5) as reader:
            included_fields = get_included_reads_table_fields(reader, selection)
            reads = parse_reads_table_all(reader, included_fields)

        assert isinstance(reads, pl.LazyFrame)

        schema_names = reads.collect_schema().names()
        assert "read_id" in schema_names
        assert "run_info" in schema_names
        # Previously a bare expression that checked nothing.
        # NOTE(review): assumes reads_fields holds reads-table column names,
        # mirroring the info_fields check in test_parse_run_info - confirm.
        for reads_field in selection.reads_fields:
            assert reads_field in schema_names

        assert len(reads.collect()) == 10

    def test_parse_reads_multi_chunk(self, pod5_factory) -> None:
        """Test the reads table parser when the reads are yielded in several chunks"""
        selection = select_fields()
        a_pod5 = pod5_factory(1100)
        with p5.Reader(a_pod5) as reader:
            included_fields = get_included_reads_table_fields(reader, selection)
            # Consume the generator while the reader is still open
            tables = list(
                parse_read_table_chunks(reader, included_fields, approx_size=999)
            )

        # 1100 reads with approx_size=999 are expected to arrive as two chunks
        assert len(tables) == 2
        for table in tables:
            assert isinstance(table, pl.LazyFrame)
            schema_names = table.collect_schema().names()
            assert "read_id" in schema_names
            assert "run_info" in schema_names
            # Previously a bare expression that checked nothing.
            # NOTE(review): assumes reads_fields holds reads-table column
            # names, mirroring the info_fields check - confirm.
            for reads_field in selection.reads_fields:
                assert reads_field in schema_names

        all_reads = pl.concat(tables)
        assert len(all_reads.collect()) == 1100

    def test_unique_on_duplicated_run_info(self) -> None:
        """Legacy bug where run_info data was duplicated"""
        # Three reads that all point at the same run_info key
        reads = pl.DataFrame(
            {"read_id": ["a", "b", "c"], "run_info": ["r1", "r1", "r1"]}
        ).lazy()
        # The matching run_info row appears twice
        run_info = pl.DataFrame(
            {"acquisition_id": ["r1", "r1"], "data": ["d1", "d1"]}
        ).lazy()

        assert_unique_acquisition_id(run_info, Path.cwd())
        joined = join_reads_to_run_info(reads, run_info)

        n_reads = len(reads.collect())
        n_run_info = len(run_info.collect())
        n_joined = len(joined.collect())

        assert n_reads == 3
        assert n_run_info == 2
        # If len(joined) is 6, the uniqueness of run_info has failed and the
        # join operation has doubled-up every row
        assert n_joined == 3


class TestSelection:
    """Test selection options"""

    def test_select(self) -> None:
        """Test the include / exclude parsing of select_fields"""
        # No arguments selects every known field
        assert set(ALL_FIELDS) == select_fields().selected

        assert {"read_id"} == select_fields(group_read_id=True).selected

        # Includes: empty items and surrounding whitespace are ignored
        assert {"read_id"} == select_fields(include="read_id").selected
        assert {"read_id", "filename"} == select_fields(
            include="read_id,filename"
        ).selected
        assert {"read_id", "filename"} == select_fields(
            include=",read_id,filename,,,"
        ).selected
        assert {"read_id", "filename"} == select_fields(
            include=" read_id ,  filename "
        ).selected
        assert {"mux", "channel"} == select_fields(include=" mux,  channel").selected
        assert set(ALL_FIELDS) == select_fields(include=",".join(ALL_FIELDS)).selected
        assert set(ALL_FIELDS) == select_fields(include="").selected

        # Excludes
        assert "read_id" not in select_fields(exclude="read_id").selected
        # Neither excluded field may remain selected. Writing
        # `{...} not in selected` would search for the set itself as a single
        # element of a set of strings, which is never present, so that form
        # of the assertion could not fail.
        assert {"pore_type", "mux"}.isdisjoint(
            select_fields(exclude="pore_type,mux").selected
        )
        assert set(ALL_FIELDS) == select_fields(exclude="").selected
        assert set(ALL_FIELDS) == select_fields(exclude=", ,").selected

        drop_rid = set(ALL_FIELDS) - {"read_id"}
        assert drop_rid == select_fields(exclude="read_id").selected
        assert drop_rid == select_fields(exclude=",read_id,,   ,").selected

    @pytest.mark.parametrize("field", ["read_i", "mix", "ed_reason", "_", "channell"])
    def test_misspelling(self, field: str) -> None:
        """Test select raises errors on unknown / misspelled fields"""
        with pytest.raises(KeyError, match=f"Field: '{field}' did not match"):
            select_fields(include=field)

    def test_randomly(self) -> None:
        """Randomly include / exclude"""
        for idx in range(1_000):
            # Seed per iteration so any failing combination is reproducible
            random.seed(idx)
            incl = set(random.choices(ALL_FIELDS, k=random.randint(1, len(ALL_FIELDS))))
            excl = set(random.choices(ALL_FIELDS, k=random.randint(0, len(ALL_FIELDS))))

            expected = incl - excl
            include = ",".join(incl)
            exclude = ",".join(excl)
            try:
                assert (
                    expected == select_fields(include=include, exclude=exclude).selected
                )
            except RuntimeError:
                # A RuntimeError is only acceptable when nothing is left selected
                assert len(expected) == 0

    def test_get_field(self) -> None:
        """Test get_field_or_raise"""
        with pytest.raises(KeyError, match="any known fields"):
            get_field_or_raise("blah")

        with pytest.raises(KeyError, match="any known fields"):
            get_field_or_raise("")

        for field in ALL_FIELDS:
            ret = get_field_or_raise(field)
            assert isinstance(ret, Field)


class TestMisc:
    """Miscellaneous tests for helpers which do not need a pod5 file"""

    def test_resolve_output(self, tmp_path: Path) -> None:
        """Test how resolve_output treats missing, existing and directory paths"""
        # NOTE(review): the second argument is presumably a force-overwrite
        # flag - confirm against resolve_output
        assert resolve_output(None, True) is None
        assert resolve_output(None, False) is None

        # A path which does not exist is returned unchanged
        no_exist = tmp_path / "no_exist"
        assert resolve_output(no_exist, False) == no_exist
        assert resolve_output(no_exist, True) == no_exist

        exist = tmp_path / "exist"
        exist.touch()
        assert resolve_output(exist, True) == exist

        # Re-create the file before checking that an existing path is refused
        exist.touch()
        with pytest.raises(FileExistsError):
            resolve_output(exist, False)

        # Test the default output path if a directory is given
        assert tmp_path / "view.txt" == resolve_output(tmp_path, False)

    def test_fields(self) -> None:
        """ALL_FIELDS must list exactly the keys of FIELDS, in the same order"""
        # Compare whole lists: zip() stops at the shorter input, so a pairwise
        # comparison would silently accept a missing or an extra field.
        assert list(ALL_FIELDS) == list(FIELDS.keys())
        assert len(FIELDS) > 0

    def test_unique_acquisition_id(self) -> None:
        """Test assert_unique_acquisition_id on consistent and conflicting rows"""
        # Rows which repeat an acquisition_id carry identical data
        pass_example = pl.DataFrame(
            {"acquisition_id": [1, 1, 3], "b": [1, 1, 3], "c": [2, 2, 3]}
        ).lazy()
        assert_unique_acquisition_id(pass_example, Path("none"))

        # Rows which repeat an acquisition_id carry different data
        fail_example = pl.DataFrame(
            {"acquisition_id": [1, 1, 3], "b": [1, 2, 3], "c": [2, 1, 3]}
        ).lazy()
        with pytest.raises(AssertionError, match="acquisition_id"):
            assert_unique_acquisition_id(fail_example, Path("none"))


================================================
FILE: python/pod5/src/tests/test_writer.py
================================================
"""
Testing Pod5Writer
"""

import math
import lib_pod5 as p5b
import numpy as np
import pytest

import pod5 as p5


class TestPod5Writer:
    """Test the Pod5Writer from a pod5 file"""

    def test_writer_fixture(self, writer: p5.Writer) -> None:
        """Basic assertions on the writer fixture"""
        assert isinstance(writer, p5.Writer)
        assert isinstance(writer._writer, p5b.FileWriter)

    @pytest.mark.parametrize("random_read", [1, 2, 3, 4], indirect=True)
    def test_writer_random_reads(self, writer: p5.Writer, random_read: p5.Read) -> None:
        """Write some random single reads to a writer"""

        writer.add_read(random_read)

    @pytest.mark.parametrize("random_read_pre_compressed", [1], indirect=True)
    def test_writer_random_reads_compressed(
        self, writer: p5.Writer, random_read_pre_compressed: p5.Read
    ) -> None:
        """Write some random single reads to a writer which are pre-compressed"""
        writer.add_read(random_read_pre_compressed)

    def test_read_edit_write(self, reader: p5.Reader, writer: p5.Writer) -> None:
        """Read some records, edit the reads and write an edited read"""

        records = 0
        for record in reader:
            records += 1
            read = record.to_read()

            # Edit some attributes
            read.calibration = p5.Calibration(0, 1)
            read.end_reason = p5.EndReason.from_reason_with_default_forced(
                p5.EndReasonEnum.DATA_SERVICE_UNBLOCK_MUX_CHANGE
            )
            # Edit the signal
            read.signal = np.arange(0, 100, dtype=np.int16)

            # Write the edited read
            writer.add_read(read)

        writer.close()

        edited = 0
        # Open the written file in a context manager so that it is closed
        # again once the checks are done
        with p5.Reader(writer.path) as edited_reader:
            for edited_record in edited_reader:
                edited += 1
                assert edited_record.calibration.offset == 0
                assert edited_record.calibration.scale == 1
                assert (
                    edited_record.end_reason
                    == p5.EndReason.from_reason_with_default_forced(
                        p5.EndReasonEnum.DATA_SERVICE_UNBLOCK_MUX_CHANGE
                    )
                )
                assert len(edited_record.signal) == 100
                assert min(edited_record.signal) == 0
                assert max(edited_record.signal) == 99

        assert edited == records

    def test_read_copy(self, reader: p5.Reader, writer: p5.Writer) -> None:
        """Copy every record unmodified and check the copies match the originals"""

        records = {}
        for record in reader:
            records[record.read_id] = record
            read = record.to_read()
            writer.add_read(read)
        writer.close()

        # The copied records are compared while their reader is still open and
        # the reader is closed afterwards
        with p5.Reader(writer.path) as copied_reader:
            edited = {}
            for edited_record in copied_reader:
                edited[edited_record.read_id] = edited_record

            assert len(records) == len(edited)
            for read_id in records.keys():
                before = records[read_id]
                after = edited[read_id]

                assert before.read_id == after.read_id
                assert before.read_number == after.read_number
                assert before.start_sample == after.start_sample
                assert before.num_samples == after.num_samples
                # NaN never compares equal to itself, so two NaN medians are
                # accepted explicitly
                medians = (before.median_before, after.median_before)
                assert all(math.isnan(m) for m in medians) or medians[0] == medians[1]
                assert before.num_minknow_events == after.num_minknow_events
                assert before.tracked_scaling == after.tracked_scaling
                assert before.predicted_scaling == after.predicted_scaling
                assert (
                    before.num_reads_since_mux_change
                    == after.num_reads_since_mux_change
                )
                assert before.time_since_mux_change == after.time_since_mux_change
                assert before.pore == after.pore
                assert before.calibration == after.calibration
                assert before.calibration_digitisation == after.calibration_digitisation
                assert before.calibration_range == after.calibration_range
                assert before.end_reason == after.end_reason
                assert before.run_info == after.run_info
                assert before.end_reason_index == after.end_reason_index
                assert before.run_info_index == after.run_info_index
                assert before.sample_count == after.sample_count
                # assert before.byte_count == after.byte_count
                assert before.has_cached_signal == after.has_cached_signal
                assert np.array_equal(before.signal, after.signal)
                assert np.array_equal(before.signal_pa, after.signal_pa)

    def test_read_record_type_check(self, reader: p5.Reader, writer: p5.Writer) -> None:
        """Check type errors raised when passing ReadRecords to writer"""
        with pytest.raises(TypeError, match="ReadRecord.to_read"):
            for record in reader:
                writer.add_read(record)  # type: ignore

        with pytest.raises(TypeError, match="ReadRecord.to_read"):
            writer.add_reads([r for r in reader])  # type: ignore

        with pytest.raises(TypeError, match="unexpected type"):
            writer.add_read([1])  # type: ignore

        writer.close()


================================================
FILE: python/pod5/test_utils/check_pod5_files_equal.py
================================================
import argparse
import itertools
import sys
from pathlib import Path

import pod5 as p5


def main():
    """Compare two pod5 files read-by-read and report any differences.

    The two positional command line arguments are the paths of the files to
    compare. Reads are compared in file order on their read_id, a fixed list of
    record fields and their signal. Every difference is printed.

    Exits with status 0 when no differences were found and 1 otherwise.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("input_a", type=Path)
    parser.add_argument("input_b", type=Path)

    args = parser.parse_args()

    fields = [
        "read_number",
        "start_sample",
        "median_before",
        "pore",
        "calibration",
        "end_reason",
        "run_info",
    ]

    errors = 0
    read_count = 0
    # Context managers make sure both files are closed again
    with p5.Reader(args.input_a) as file_a, p5.Reader(args.input_b) as file_b:
        for a, b in itertools.zip_longest(file_a.reads(), file_b.reads()):
            read_count += 1

            # zip_longest pads the shorter file with None: report the differing
            # read counts instead of failing on an attribute access
            if a is None or b is None:
                shorter = "input_a" if a is None else "input_b"
                print(
                    f"Files contain different numbers of reads: {shorter} has no"
                    f" read at row {read_count}"
                )
                errors += 1
                break

            if a.read_id != b.read_id:
                print(
                    f"Different reads found in file at row {read_count}: {a.read_id} vs {b.read_id}"
                )
                errors += 1

            read_id = a.read_id

            for field in fields:
                a_val = getattr(a, field)
                b_val = getattr(b, field)
                # Handle NAN specially:
                if a_val != a_val:
                    if b_val == b_val:
                        print(
                            f"Read {read_id}: Field {field} not equal: {a_val} vs {b_val}"
                        )
                        errors += 1
                else:
                    if a_val != b_val:
                        print(
                            f"Read {read_id}: Field {field} not equal: {a_val} vs {b_val}"
                        )
                        errors += 1

            a_signal = a.signal
            b_signal = b.signal
            # Compare the lengths first: an element-wise comparison is only
            # meaningful for signals of the same length
            if len(a_signal) != len(b_signal) or (a_signal != b_signal).any():
                print(
                    f"Read {read_count} {read_id} signal not equal: {len(a_signal)} elements:"
                    f" {a_signal} vs {len(b_signal)} elements: {b_signal}"
                )
                errors += 1

    if errors == 0:
        print("Files consistent")
        sys.exit(0)

    print("Errors detected")
    sys.exit(1)


if __name__ == "__main__":
    main()


================================================
FILE: test_data/multi_fast5_zip_v0.pod5
================================================
version https://git-lfs.github.com/spec/v1
oid sha256:9eb656f0061f1621b205b4c5f4d9694b03cad4480c66e2a2d8ea4423f53ea243
size 1321288


================================================
FILE: test_data/multi_fast5_zip_v1.pod5
================================================
version https://git-lfs.github.com/spec/v1
oid sha256:64ec14c7483a0ebb812c7b09ee52e115927a4d2f693abc1ad27c9cc548b1e770
size 1322840


================================================
FILE: test_data/multi_fast5_zip_v2.pod5
================================================
version https://git-lfs.github.com/spec/v1
oid sha256:b1cd3c85e8e2b8fdbc68c53ae8e8ca66655b95341be58abbba53353c5d7dba0a
size 1323072


================================================
FILE: test_data/multi_fast5_zip_v3.pod5
================================================
version https://git-lfs.github.com/spec/v1
oid sha256:b87153aa81a5884205b047df336a2e15e95becce6dc997a38a76b972cf6a82bc
size 1323624


================================================
FILE: test_data/multi_fast5_zip_v4.pod5
================================================
version https://git-lfs.github.com/spec/v1
oid sha256:9d0bdb7faef6ada8181eb620eb6f41256c6437680585b104fc19ee674c88d5f1
size 1323824


================================================
FILE: test_data/split_1_v4.pod5
================================================
version https://git-lfs.github.com/spec/v1
oid sha256:5fe01201db83dc57fbb8f9ee1420fdeae8bb597f8dd6a57d3602b5d3d779fc80
size 151552


================================================
FILE: test_data/split_2_v4.pod5
================================================
version https://git-lfs.github.com/spec/v1
oid sha256:900e68cb12055b38f938c440c8fec85f79be020ba7f3e147fcf6824514bc8915
size 142896


================================================
FILE: test_data/subset_mapping_examples/read_ids.txt
================================================

# empty lines and comment
# example invalid uuid hidden by comment
# 0000173c-bf67-44e7-9a9c-1ad0bc728e7a.
read_id
0000173c-bf67-44e7-9a9c-1ad0bc728e74
00925f34-6baf-47fc-b40c-22591e27fb5c
# Comment example


================================================
FILE: test_data/subset_mapping_examples/subset.csv
================================================
output_1.pod5,0000173c-bf67-44e7-9a9c-1ad0bc728e74
output_1.pod5,006d1319-2877-4b34-85df-34de7250a47b
output_2.pod5,00925f34-6baf-47fc-b40c-22591e27fb5c
output_2.pod5,009dc9bd-c5f4-487b-ba4c-b9ce7e3a711e


================================================
FILE: test_data/subset_mapping_examples/subset.summary
================================================
read_id mux barcode
0000173c-bf67-44e7-9a9c-1ad0bc728e74	1	barcode_1
006d1319-2877-4b34-85df-34de7250a47b	1	barcode_2
00925f34-6baf-47fc-b40c-22591e27fb5c	2	barcode_1
009dc9bd-c5f4-487b-ba4c-b9ce7e3a711e	2	barcode_2


================================================
FILE: test_package/CMakeLists.txt
================================================
# Minimal consumer project which checks that an installed pod5_file_format
# package can be found, compiled against and linked.
#
# CMake 3.12 is the first release which accepts the value 20 for CXX_STANDARD
# (set below), so older versions cannot configure this project.
cmake_minimum_required(VERSION 3.12)
project(test_package CXX)

# Test components
find_package(pod5_file_format REQUIRED CONFIG)
add_executable(${PROJECT_NAME} test_package.cpp test_cpp_api.cpp)

# Make the headers in the repository's third_party/include directory available
target_include_directories(${PROJECT_NAME}
    PUBLIC
        ${CMAKE_SOURCE_DIR}/../third_party/include
)

set_target_properties(${PROJECT_NAME}
    PROPERTIES
        CXX_STANDARD 20
)

target_link_libraries(${PROJECT_NAME} pod5_file_format::pod5_file_format)


================================================
FILE: test_package/conanfile.py
================================================
import os

from conan import ConanFile
from conan.tools.build import can_run
from conan.tools.cmake import cmake_layout, CMake


class TestPackageConan(ConanFile):
    """Conan test_package recipe: builds and runs a small consumer executable
    against the package under test."""

    settings = "os", "arch", "compiler", "build_type"
    options = {
        "compiler.sanitizer": [
            None,
            "AddressStatic",
            "ThreadStatic",
            "UndefinedBehaviorStatic",
        ]
    }
    default_options = {"compiler.sanitizer": None}
    generators = "CMakeDeps", "CMakeToolchain", "VirtualRunEnv"
    test_type = "explicit"

    def requirements(self):
        """Require the package reference which is being tested."""
        self.requires(self.tested_reference_str)

    def layout(self):
        """Use the standard CMake folder layout."""
        cmake_layout(self)

    def build(self):
        """Configure and build the test project with CMake."""
        cmake = CMake(self)
        cmake.configure()
        cmake.build()

    @property
    def _test_executable(self):
        """Path of the built test executable in the first build bindir."""
        return os.path.join(self.cpp.build.bindirs[0], "test_package")

    def test(self):
        """Run the test executable, or warn when it cannot run on this machine."""
        if can_run(self):
            self.run(self._test_executable, env="conanrun")
        else:
            # Conan 2 names this method `warning`; `warn` is the Conan 1.x
            # spelling and is kept as a fallback.
            warn = getattr(self.output, "warning", None) or self.output.warn
            warn("Pod5Conan test: cross_building is true")


================================================
FILE: test_package/test_cpp_api.cpp
================================================
#include "pod5_format/file_writer.h"
#include "pod5_format/read_table_writer.h"
#include "pod5_format/run_info_table_writer.h"
#include "pod5_format/signal_table_writer.h"


================================================
FILE: test_package/test_package.cpp
================================================
#include "pod5_format/c_api.h"

#include <iostream>

// Smoke test for the packaged library: initialise and terminate pod5 through
// the C API. Returns 0 when both calls report POD5_OK and 1 otherwise, so that
// a failure is visible to whatever runs this executable.
int main()
{
    int exit_code = 0;

    std::cout << "Initializing POD5...." << std::endl;
    if (pod5_init() == POD5_OK) {
        std::cout << "Pod5 successfully initialized." << std::endl;
    } else {
        std::cerr << "Failed to initialize Pod5!" << std::endl;
        exit_code = 1;
    }

    // Termination is attempted even if initialisation failed, as before
    std::cout << "Shutting down POD5 gracefully...." << std::endl;
    if (pod5_terminate() == POD5_OK) {
        std::cout << "Pod5 successfully terminated." << std::endl;
    } else {
        std::cerr << "Failed to shut down Pod5!" << std::endl;
        exit_code = 1;
    }

    return exit_code;
}


================================================
FILE: third_party/build_instructions.txt
================================================
These instructions provide details on how to re-create the third party support libraries from source.

For each library, see software_version.yaml for download links, versions and license information.

These instructions all assume you have set the THIRD_PARTY_LIBS env var:

THIRD_PARTY_LIBS=/path/to/pod5-file-format/third_party
mkdir -p $THIRD_PARTY_LIBS/include


Catch2
======

Download catch.hpp from the release and put it in $THIRD_PARTY_LIBS/include/catch2


GSL Lite
========

Download and extract the tarball. From a bash prompt, cd into the extracted directory and carry out the following steps.

Apply the gsl patches in $THIRD_PARTY_LIBS:
    for p in $THIRD_PARTY_LIBS/gsl-*.patch; do
        patch -Np1 -i $p
    done

Copy the headers:
    rm -rf $THIRD_PARTY_LIBS/include/gsl $THIRD_PARTY_LIBS/include/gsl.h
    cp -r include/* $THIRD_PARTY_LIBS/include/


================================================
FILE: third_party/gsl-disable-gsl-suppress.patch
================================================
--- a/include/gsl/gsl-lite.hpp
+++ b/include/gsl/gsl-lite.hpp
@@ -1081,7 +1081,7 @@ namespace __cxxabiv1 { struct __cxa_eh_globals; extern "C" __cxa_eh_globals * __
 // MSVC warning suppression macros:

 #if gsl_COMPILER_MSVC_VERSION >= 140 && ! gsl_COMPILER_NVCC_VERSION
-# define gsl_SUPPRESS_MSGSL_WARNING(expr)        [[gsl::suppress(expr)]]
+# define gsl_SUPPRESS_MSGSL_WARNING(expr)        /* Pimm: note disabled for intel [[gsl::suppress(expr)]]*/
 # define gsl_SUPPRESS_MSVC_WARNING(code, descr)  __pragma(warning(suppress: code) )
 # define gsl_DISABLE_MSVC_WARNINGS(codes)        __pragma(warning(push))  __pragma(warning(disable: codes))
 # define gsl_RESTORE_MSVC_WARNINGS()             __pragma(warning(pop ))


================================================
FILE: third_party/include/.editorconfig
================================================
# All code in this directory is third-party - don't enforce any particular settings
root = true


================================================
FILE: third_party/include/catch2/catch.hpp
================================================
/*
 *  Catch v2.13.7
 *  Generated: 2021-07-28 20:29:27.753164
 *  ----------------------------------------------------------
 *  This file has been merged from multiple headers. Please don't edit it
 * directly Copyright (c) 2021 Two Blue Cubes Ltd. All rights reserved.
 *
 *  Distributed under the Boost Software License, Version 1.0. (See accompanying
 *  file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
 */
#ifndef TWOBLUECUBES_SINGLE_INCLUDE_CATCH_HPP_INCLUDED
#define TWOBLUECUBES_SINGLE_INCLUDE_CATCH_HPP_INCLUDED
// start catch.hpp

#define CATCH_VERSION_MAJOR 2
#define CATCH_VERSION_MINOR 13
#define CATCH_VERSION_PATCH 7

#ifdef __clang__
#pragma clang system_header
#elif defined __GNUC__
#pragma GCC system_header
#endif

// start catch_suppress_warnings.h

#ifdef __clang__
#ifdef __ICC  // icpc defines the __clang__ macro
#pragma warning(push)
#pragma warning(disable : 161 1682)
#else  // __ICC
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wpadded"
#pragma clang diagnostic ignored "-Wswitch-enum"
#pragma clang diagnostic ignored "-Wcovered-switch-default"
#endif
#elif defined __GNUC__
// Because REQUIREs trigger GCC's -Wparentheses, and because still
// supported version of g++ have only buggy support for _Pragmas,
// Wparentheses have to be suppressed globally.
#pragma GCC diagnostic ignored "-Wparentheses"  // See #674 for details

#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
#pragma GCC diagnostic ignored "-Wpadded"
#endif
// end catch_suppress_warnings.h
#if defined(CATCH_CONFIG_MAIN) || defined(CATCH_CONFIG_RUNNER)
#define CATCH_IMPL
#define CATCH_CONFIG_ALL_PARTS
#endif

// In the impl file, we want to have access to all parts of the headers
// Can also be used to sanely support PCHs
#if defined(CATCH_CONFIG_ALL_PARTS)
#define CATCH_CONFIG_EXTERNAL_INTERFACES
#if defined(CATCH_CONFIG_DISABLE_MATCHERS)
#undef CATCH_CONFIG_DISABLE_MATCHERS
#endif
#if !defined(CATCH_CONFIG_ENABLE_CHRONO_STRINGMAKER)
#define CATCH_CONFIG_ENABLE_CHRONO_STRINGMAKER
#endif
#endif

#if !defined(CATCH_CONFIG_IMPL_ONLY)
// start catch_platform.h

// See e.g.:
// https://opensource.apple.com/source/CarbonHeaders/CarbonHeaders-18.1/TargetConditionals.h.auto.html
#ifdef __APPLE__
#include <TargetConditionals.h>
#if (defined(TARGET_OS_OSX) && TARGET_OS_OSX == 1) || (defined(TARGET_OS_MAC) && TARGET_OS_MAC == 1)
#define CATCH_PLATFORM_MAC
#elif (defined(TARGET_OS_IPHONE) && TARGET_OS_IPHONE == 1)
#define CATCH_PLATFORM_IPHONE
#endif

#elif defined(linux) || defined(__linux) || defined(__linux__)
#define CATCH_PLATFORM_LINUX

#elif defined(WIN32) || defined(__WIN32__) || defined(_WIN32) || defined(_MSC_VER) || \
        defined(__MINGW32__)
#define CATCH_PLATFORM_WINDOWS
#endif

// end catch_platform.h

#ifdef CATCH_IMPL
#ifndef CLARA_CONFIG_MAIN
#define CLARA_CONFIG_MAIN_NOT_DEFINED
#define CLARA_CONFIG_MAIN
#endif
#endif

// start catch_user_interfaces.h

namespace Catch {
unsigned int rngSeed();
}

// end catch_user_interfaces.h
// start catch_tag_alias_autoregistrar.h

// start catch_common.h

// start catch_compiler_capabilities.h

// Detect a number of compiler features - by compiler
// The following features are defined:
//
// CATCH_CONFIG_COUNTER : is the __COUNTER__ macro supported?
// CATCH_CONFIG_WINDOWS_SEH : is Windows SEH supported?
// CATCH_CONFIG_POSIX_SIGNALS : are POSIX signals supported?
// CATCH_CONFIG_DISABLE_EXCEPTIONS : Are exceptions enabled?
// ****************
// Note to maintainers: if new toggles are added please document them
// in configuration.md, too
// ****************

// In general each macro has a _NO_<feature name> form
// (e.g. CATCH_CONFIG_NO_POSIX_SIGNALS) which disables the feature.
// Many features, at point of detection, define an _INTERNAL_ macro, so they
// can be combined, en-mass, with the _NO_ forms later.

#ifdef __cplusplus

#if (__cplusplus >= 201402L) || (defined(_MSVC_LANG) && _MSVC_LANG >= 201402L)
#define CATCH_CPP14_OR_GREATER
#endif

#if (__cplusplus >= 201703L) || (defined(_MSVC_LANG) && _MSVC_LANG >= 201703L)
#define CATCH_CPP17_OR_GREATER
#endif

#endif

// Only GCC compiler should be used in this block, so other compilers trying to
// mask themselves as GCC should be ignored.
#if defined(__GNUC__) && !defined(__clang__) && !defined(__ICC) && !defined(__CUDACC__) && \
        !defined(__LCC__)
#define CATCH_INTERNAL_START_WARNINGS_SUPPRESSION _Pragma("GCC diagnostic push")
#define CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION _Pragma("GCC diagnostic pop")

#define CATCH_INTERNAL_IGNORE_BUT_WARN(...) (void)__builtin_constant_p(__VA_ARGS__)

#endif

#if defined(__clang__)

#define CATCH_INTERNAL_START_WARNINGS_SUPPRESSION _Pragma("clang diagnostic push")
#define CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION _Pragma("clang diagnostic pop")

// As of this writing, IBM XL's implementation of __builtin_constant_p has a bug
// which results in calls to destructors being emitted for each temporary,
// without a matching initialization. In practice, this can result in something
// like `std::string::~string` being called on an uninitialized value.
//
// For example, this code will likely segfault under IBM XL:
// ```
// REQUIRE(std::string("12") + "34" == "1234")
// ```
//
// Therefore, `CATCH_INTERNAL_IGNORE_BUT_WARN` is not implemented.
#if !defined(__ibmxl__) && !defined(__CUDACC__)
#define CATCH_INTERNAL_IGNORE_BUT_WARN(...) \
    (void)__builtin_constant_p(             \
            __VA_ARGS__) /* NOLINT(cppcoreguidelines-pro-type-vararg,                \
                      hicpp-vararg) */
#endif

#define CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                    \
    _Pragma("clang diagnostic ignored \"-Wexit-time-destructors\"") \
            _Pragma("clang diagnostic ignored \"-Wglobal-constructors\"")

#define CATCH_INTERNAL_SUPPRESS_PARENTHESES_WARNINGS \
    _Pragma("clang diagnostic ignored \"-Wparentheses\"")

#define CATCH_INTERNAL_SUPPRESS_UNUSED_WARNINGS \
    _Pragma("clang diagnostic ignored \"-Wunused-variable\"")

#define CATCH_INTERNAL_SUPPRESS_ZERO_VARIADIC_WARNINGS \
    _Pragma("clang diagnostic ignored \"-Wgnu-zero-variadic-macro-arguments\"")

#define CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS \
    _Pragma("clang diagnostic ignored \"-Wunused-template\"")

#endif  // __clang__

////////////////////////////////////////////////////////////////////////////////
// Assume that non-Windows platforms support posix signals by default
#if !defined(CATCH_PLATFORM_WINDOWS)
#define CATCH_INTERNAL_CONFIG_POSIX_SIGNALS
#endif

////////////////////////////////////////////////////////////////////////////////
// We know some environments not to support full POSIX signals
#if defined(__CYGWIN__) || defined(__QNX__) || defined(__EMSCRIPTEN__) || defined(__DJGPP__)
#define CATCH_INTERNAL_CONFIG_NO_POSIX_SIGNALS
#endif

#ifdef __OS400__
#define CATCH_INTERNAL_CONFIG_NO_POSIX_SIGNALS
#define CATCH_CONFIG_COLOUR_NONE
#endif

////////////////////////////////////////////////////////////////////////////////
// Android somehow still does not support std::to_string
#if defined(__ANDROID__)
#define CATCH_INTERNAL_CONFIG_NO_CPP11_TO_STRING
#define CATCH_INTERNAL_CONFIG_ANDROID_LOGWRITE
#endif

////////////////////////////////////////////////////////////////////////////////
// Not all Windows environments support SEH properly
#if defined(__MINGW32__)
#define CATCH_INTERNAL_CONFIG_NO_WINDOWS_SEH
#endif

////////////////////////////////////////////////////////////////////////////////
// PS4
#if defined(__ORBIS__)
#define CATCH_INTERNAL_CONFIG_NO_NEW_CAPTURE
#endif

////////////////////////////////////////////////////////////////////////////////
// Cygwin
#ifdef __CYGWIN__

// Required for some versions of Cygwin to declare gettimeofday
// see:
// http://stackoverflow.com/questions/36901803/gettimeofday-not-declared-in-this-scope-cygwin
#define _BSD_SOURCE
// some versions of cygwin (most) do not support std::to_string. Use the libstd
// check.
// https://gcc.gnu.org/onlinedocs/gcc-4.8.2/libstdc++/api/a01053_source.html
// line 2812-2813
#if !((__cplusplus >= 201103L) && defined(_GLIBCXX_USE_C99) && \
      !defined(_GLIBCXX_HAVE_BROKEN_VSWPRINTF))

#define CATCH_INTERNAL_CONFIG_NO_CPP11_TO_STRING

#endif
#endif  // __CYGWIN__

////////////////////////////////////////////////////////////////////////////////
// Visual C++
#if defined(_MSC_VER)

#define CATCH_INTERNAL_START_WARNINGS_SUPPRESSION __pragma(warning(push))
#define CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION __pragma(warning(pop))

// Universal Windows platform does not support SEH
// Or console colours (or console at all...)
#if defined(WINAPI_FAMILY) && (WINAPI_FAMILY == WINAPI_FAMILY_APP)
#define CATCH_CONFIG_COLOUR_NONE
#else
#define CATCH_INTERNAL_CONFIG_WINDOWS_SEH
#endif

// MSVC traditional preprocessor needs some workaround for __VA_ARGS__
// _MSVC_TRADITIONAL == 0 means new conformant preprocessor
// _MSVC_TRADITIONAL == 1 means old traditional non-conformant preprocessor
#if !defined(__clang__)  // Handle Clang masquerading for msvc
#if !defined(_MSVC_TRADITIONAL) || (defined(_MSVC_TRADITIONAL) && _MSVC_TRADITIONAL)
#define CATCH_INTERNAL_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#endif  // MSVC_TRADITIONAL
#endif  // __clang__

#endif  // _MSC_VER

#if defined(_REENTRANT) || defined(_MSC_VER)
// Enable async processing, as -pthread is specified or no additional linking is
// required
#define CATCH_INTERNAL_CONFIG_USE_ASYNC
#endif  // _MSC_VER

////////////////////////////////////////////////////////////////////////////////
// Check if we are compiled with -fno-exceptions or equivalent
#if defined(__EXCEPTIONS) || defined(__cpp_exceptions) || defined(_CPPUNWIND)
#define CATCH_INTERNAL_CONFIG_EXCEPTIONS_ENABLED
#endif

////////////////////////////////////////////////////////////////////////////////
// DJGPP
#ifdef __DJGPP__
#define CATCH_INTERNAL_CONFIG_NO_WCHAR
#endif  // __DJGPP__

////////////////////////////////////////////////////////////////////////////////
// Embarcadero C++Build
#if defined(__BORLANDC__)
#define CATCH_INTERNAL_CONFIG_POLYFILL_ISNAN
#endif

////////////////////////////////////////////////////////////////////////////////

// Use of __COUNTER__ is suppressed during code analysis in
// CLion/AppCode 2017.2.x and former, because __COUNTER__ is not properly
// handled by it.
// Otherwise all supported compilers support COUNTER macro,
// but user still might want to turn it off
#if (!defined(__JETBRAINS_IDE__) || __JETBRAINS_IDE__ >= 20170300L)
#define CATCH_INTERNAL_CONFIG_COUNTER
#endif

////////////////////////////////////////////////////////////////////////////////

// RTX is a special version of Windows that is real time.
// This means that it is detected as Windows, but does not provide
// the same set of capabilities as real Windows does.
#if defined(UNDER_RTSS) || defined(RTX64_BUILD)
#define CATCH_INTERNAL_CONFIG_NO_WINDOWS_SEH
#define CATCH_INTERNAL_CONFIG_NO_ASYNC
#define CATCH_CONFIG_COLOUR_NONE
#endif

#if !defined(_GLIBCXX_USE_C99_MATH_TR1)
#define CATCH_INTERNAL_CONFIG_GLOBAL_NEXTAFTER
#endif

// Various stdlib support checks that require __has_include
// Each check only sets a CATCH_INTERNAL_CONFIG_CPP17_* candidate; nothing in
// this section defines a public CATCH_CONFIG_CPP17_* switch except the
// explicit CATCH_CONFIG_NO_CPP17_VARIANT veto below.
#if defined(__has_include)
// Check if string_view is available and usable
#if __has_include(<string_view>) && defined(CATCH_CPP17_OR_GREATER)
#define CATCH_INTERNAL_CONFIG_CPP17_STRING_VIEW
#endif

// Check if optional is available and usable
#if __has_include(<optional>) && defined(CATCH_CPP17_OR_GREATER)
#define CATCH_INTERNAL_CONFIG_CPP17_OPTIONAL
#endif  // __has_include(<optional>) && defined(CATCH_CPP17_OR_GREATER)

// Check if byte is available and usable
// <cstddef> is included first so that __cpp_lib_byte can be inspected.
#if __has_include(<cstddef>) && defined(CATCH_CPP17_OR_GREATER)
#include <cstddef>
#if defined(__cpp_lib_byte) && (__cpp_lib_byte > 0)
#define CATCH_INTERNAL_CONFIG_CPP17_BYTE
#endif
#endif  // __has_include(<cstddef>) && defined(CATCH_CPP17_OR_GREATER)

// Check if variant is available and usable
#if __has_include(<variant>) && defined(CATCH_CPP17_OR_GREATER)
#if defined(__clang__) && (__clang_major__ < 8)
// work around clang bug with libstdc++
// https://bugs.llvm.org/show_bug.cgi?id=31852 fix should be in clang 8,
// workaround in libstdc++ 8.2
// NOTE(review): <ciso646> is presumably pulled in only so that the libstdc++
// identification macros tested on the next line are defined -- confirm.
#include <ciso646>
#if defined(__GLIBCXX__) && defined(_GLIBCXX_RELEASE) && (_GLIBCXX_RELEASE < 9)
#define CATCH_CONFIG_NO_CPP17_VARIANT
#else
#define CATCH_INTERNAL_CONFIG_CPP17_VARIANT
#endif  // libstdc++ with _GLIBCXX_RELEASE < 9
#else
#define CATCH_INTERNAL_CONFIG_CPP17_VARIANT
#endif  // defined(__clang__) && (__clang_major__ < 8)
#endif  // __has_include(<variant>) && defined(CATCH_CPP17_OR_GREATER)
#endif  // defined(__has_include)

// Resolve the public CATCH_CONFIG_* switches.
// General pattern: a feature is turned on when its internal candidate macro
// is set (or, for default-on features, when no internal veto is set) and the
// user has neither opted out via CATCH_CONFIG_NO_* nor already defined the
// public switch.
#if defined(CATCH_INTERNAL_CONFIG_COUNTER) && \
        !(defined(CATCH_CONFIG_NO_COUNTER) || defined(CATCH_CONFIG_COUNTER))
#define CATCH_CONFIG_COUNTER
#endif

#if defined(CATCH_INTERNAL_CONFIG_WINDOWS_SEH) &&                                      \
        !(defined(CATCH_CONFIG_NO_WINDOWS_SEH) || defined(CATCH_CONFIG_WINDOWS_SEH) || \
          defined(CATCH_INTERNAL_CONFIG_NO_WINDOWS_SEH))
#define CATCH_CONFIG_WINDOWS_SEH
#endif

// This is set by default, because we assume that unix compilers are
// posix-signal-compatible by default.
#if defined(CATCH_INTERNAL_CONFIG_POSIX_SIGNALS) &&          \
        !(defined(CATCH_INTERNAL_CONFIG_NO_POSIX_SIGNALS) || \
          defined(CATCH_CONFIG_NO_POSIX_SIGNALS) || defined(CATCH_CONFIG_POSIX_SIGNALS))
#define CATCH_CONFIG_POSIX_SIGNALS
#endif

// This is set by default, because we assume that compilers with no wchar_t
// support are just rare exceptions.
#if !(defined(CATCH_INTERNAL_CONFIG_NO_WCHAR) || defined(CATCH_CONFIG_NO_WCHAR) || \
      defined(CATCH_CONFIG_WCHAR))
#define CATCH_CONFIG_WCHAR
#endif

// Default-on: std::to_string usage, unless vetoed internally or by the user.
#if !(defined(CATCH_INTERNAL_CONFIG_NO_CPP11_TO_STRING) || \
      defined(CATCH_CONFIG_NO_CPP11_TO_STRING) || defined(CATCH_CONFIG_CPP11_TO_STRING))
#define CATCH_CONFIG_CPP11_TO_STRING
#endif

// C++17 library features detected earlier.
#if defined(CATCH_INTERNAL_CONFIG_CPP17_OPTIONAL) && \
        !(defined(CATCH_CONFIG_NO_CPP17_OPTIONAL) || defined(CATCH_CONFIG_CPP17_OPTIONAL))
#define CATCH_CONFIG_CPP17_OPTIONAL
#endif

#if defined(CATCH_INTERNAL_CONFIG_CPP17_STRING_VIEW) && \
        !(defined(CATCH_CONFIG_NO_CPP17_STRING_VIEW) || defined(CATCH_CONFIG_CPP17_STRING_VIEW))
#define CATCH_CONFIG_CPP17_STRING_VIEW
#endif

#if defined(CATCH_INTERNAL_CONFIG_CPP17_VARIANT) && \
        !(defined(CATCH_CONFIG_NO_CPP17_VARIANT) || defined(CATCH_CONFIG_CPP17_VARIANT))
#define CATCH_CONFIG_CPP17_VARIANT
#endif

#if defined(CATCH_INTERNAL_CONFIG_CPP17_BYTE) && \
        !(defined(CATCH_CONFIG_NO_CPP17_BYTE) || defined(CATCH_CONFIG_CPP17_BYTE))
#define CATCH_CONFIG_CPP17_BYTE
#endif

// Experimental redirect implies the new capture mechanism as a candidate.
#ifdef CATCH_CONFIG_EXPERIMENTAL_REDIRECT
#define CATCH_INTERNAL_CONFIG_NEW_CAPTURE
#endif

#if defined(CATCH_INTERNAL_CONFIG_NEW_CAPTURE) &&          \
        !(defined(CATCH_INTERNAL_CONFIG_NO_NEW_CAPTURE) || \
          defined(CATCH_CONFIG_NO_NEW_CAPTURE) || defined(CATCH_CONFIG_NEW_CAPTURE))
#define CATCH_CONFIG_NEW_CAPTURE
#endif

// Exceptions are treated as disabled unless detection flagged them enabled.
#if !(defined(CATCH_INTERNAL_CONFIG_EXCEPTIONS_ENABLED) || \
      defined(CATCH_CONFIG_DISABLE_EXCEPTIONS))
#define CATCH_CONFIG_DISABLE_EXCEPTIONS
#endif

#if defined(CATCH_INTERNAL_CONFIG_POLYFILL_ISNAN) && \
        !(defined(CATCH_CONFIG_NO_POLYFILL_ISNAN) || defined(CATCH_CONFIG_POLYFILL_ISNAN))
#define CATCH_CONFIG_POLYFILL_ISNAN
#endif

#if defined(CATCH_INTERNAL_CONFIG_USE_ASYNC) &&                                        \
        !(defined(CATCH_INTERNAL_CONFIG_NO_ASYNC) || defined(CATCH_CONFIG_NO_USE_ASYNC) || \
          defined(CATCH_CONFIG_USE_ASYNC))
#define CATCH_CONFIG_USE_ASYNC
#endif

#if defined(CATCH_INTERNAL_CONFIG_ANDROID_LOGWRITE) && \
        !(defined(CATCH_CONFIG_NO_ANDROID_LOGWRITE) || defined(CATCH_CONFIG_ANDROID_LOGWRITE))
#define CATCH_CONFIG_ANDROID_LOGWRITE
#endif

#if defined(CATCH_INTERNAL_CONFIG_GLOBAL_NEXTAFTER) && \
        !(defined(CATCH_CONFIG_NO_GLOBAL_NEXTAFTER) || defined(CATCH_CONFIG_GLOBAL_NEXTAFTER))
#define CATCH_CONFIG_GLOBAL_NEXTAFTER
#endif

// Every warning-control macro must exist for the rest of the header to
// compile, so any that compiler detection left undefined is given an empty
// expansion here.
#ifndef CATCH_INTERNAL_START_WARNINGS_SUPPRESSION
#define CATCH_INTERNAL_START_WARNINGS_SUPPRESSION
#endif

#ifndef CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION
#define CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION
#endif

#ifndef CATCH_INTERNAL_SUPPRESS_PARENTHESES_WARNINGS
#define CATCH_INTERNAL_SUPPRESS_PARENTHESES_WARNINGS
#endif

#ifndef CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS
#define CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS
#endif

#ifndef CATCH_INTERNAL_SUPPRESS_UNUSED_WARNINGS
#define CATCH_INTERNAL_SUPPRESS_UNUSED_WARNINGS
#endif

#ifndef CATCH_INTERNAL_SUPPRESS_ZERO_VARIADIC_WARNINGS
#define CATCH_INTERNAL_SUPPRESS_ZERO_VARIADIC_WARNINGS
#endif

// The goal of this macro is to avoid evaluation of the arguments, but
// still have the compiler warn on problems inside...
// The fallback simply discards its arguments.
#ifndef CATCH_INTERNAL_IGNORE_BUT_WARN
#define CATCH_INTERNAL_IGNORE_BUT_WARN(...)
#endif

// Drop any earlier unused-template suppression on Apple clang builds with
// major version below 10 and on clang with major version below 5; the empty
// fallback right after then takes over.
#if (defined(__APPLE__) && defined(__apple_build_version__) && (__clang_major__ < 10)) || \
        (defined(__clang__) && (__clang_major__ < 5))
#undef CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS
#endif

#ifndef CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS
#define CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS
#endif

// Exception-handling keywords behind macros. With exceptions available they
// map straight onto try/catch; with CATCH_CONFIG_DISABLE_EXCEPTIONS set, the
// "try" body becomes an always-taken branch and the handlers never-taken ones.
#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
#define CATCH_TRY try
#define CATCH_CATCH_ALL catch (...)
#define CATCH_CATCH_ANON(exceptionType) catch (exceptionType)
#else
#define CATCH_TRY if ((true))
#define CATCH_CATCH_ALL if ((false))
#define CATCH_CATCH_ANON(exceptionType) if ((false))
#endif

// Turn on traditional-MSVC-preprocessor handling when it was detected and the
// user neither opted out nor defined the switch already.
#if defined(CATCH_INTERNAL_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR) &&  \
        !(defined(CATCH_CONFIG_NO_TRADITIONAL_MSVC_PREPROCESSOR) || \
          defined(CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR))
#define CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#endif

// end catch_compiler_capabilities.h
// Identifier synthesis: glue a caller-supplied prefix onto either
// __COUNTER__ (when CATCH_CONFIG_COUNTER is set) or __LINE__.
// The two-step LINE/LINE2 indirection lets the second argument be
// macro-expanded before it is pasted.
#define INTERNAL_CATCH_UNIQUE_NAME_LINE2(prefix, suffix) prefix##suffix
#define INTERNAL_CATCH_UNIQUE_NAME_LINE(prefix, suffix) \
    INTERNAL_CATCH_UNIQUE_NAME_LINE2(prefix, suffix)
#if !defined(CATCH_CONFIG_COUNTER)
#define INTERNAL_CATCH_UNIQUE_NAME(prefix) INTERNAL_CATCH_UNIQUE_NAME_LINE(prefix, __LINE__)
#else
#define INTERNAL_CATCH_UNIQUE_NAME(prefix) INTERNAL_CATCH_UNIQUE_NAME_LINE(prefix, __COUNTER__)
#endif

#include <cstdint>
#include <iosfwd>
#include <string>

// We need a dummy global operator<< so we can bring it into Catch namespace
// later
// The empty tag type exists only to give that overload a parameter type; the
// operator is declared here but not defined in this part of the file.
struct Catch_global_namespace_dummy {};
std::ostream &operator<<(std::ostream &, Catch_global_namespace_dummy);

namespace Catch {

// Wrapper giving the case-sensitivity choice a scoped spelling:
// CaseSensitive::Yes / CaseSensitive::No.
struct CaseSensitive {
    enum Choice {
        Yes = 0,
        No = 1,
    };
};

// Base class for types that must be neither copied nor moved.
// Only derived classes can construct or destroy it; all four copy/move
// operations are deleted.
class NonCopyable {
protected:
    NonCopyable();
    virtual ~NonCopyable();

private:
    NonCopyable(NonCopyable &&) = delete;
    NonCopyable(NonCopyable const &) = delete;
    NonCopyable &operator=(NonCopyable &&) = delete;
    NonCopyable &operator=(NonCopyable const &) = delete;
};

// A source location: a file-name pointer plus a line number.
// The pointer is stored exactly as passed in; nothing is copied, so the
// caller's string must outlive this object.
struct SourceLineInfo {
    // A location without a file/line pair is not representable.
    SourceLineInfo() = delete;
    // _file: file name (stored, not copied); _line: line number.
    SourceLineInfo(char const *_file, std::size_t _line) noexcept : file(_file), line(_line) {}

    SourceLineInfo(SourceLineInfo const &other) = default;
    SourceLineInfo &operator=(SourceLineInfo const &) = default;
    SourceLineInfo(SourceLineInfo &&) noexcept = default;
    SourceLineInfo &operator=(SourceLineInfo &&) noexcept = default;

    // True when there is no usable file name: the pointer is null or points
    // at an empty string. The null test keeps a location built from a null
    // pointer from being dereferenced.
    bool empty() const noexcept { return file == nullptr || file[0] == '\0'; }
    // Comparison operators are declared here and defined elsewhere.
    bool operator==(SourceLineInfo const &other) const noexcept;
    bool operator<(SourceLineInfo const &other) const noexcept;

    char const *file;
    std::size_t line;
};

// Stream insertion for a SourceLineInfo; declared here, defined elsewhere.
std::ostream &operator<<(std::ostream &os, SourceLineInfo const &info);

// Bring in operator<< from global namespace into Catch namespace
// This is necessary because the overload of operator<< above makes
// lookup stop at namespace Catch
using ::operator<<;

// Sentinel for variadic streaming macros. Appending `+StreamEndStop` keeps
// both of these forms well-formed:
//    >> +StreamEndStop
//    >> stuff +StreamEndStop
struct StreamEndStop {
    // Unary form, for when nothing precedes the sentinel. Defined elsewhere.
    auto operator+() const -> std::string;
};
// Binary form: hands the left-hand operand back untouched.
template <typename Operand>
auto operator+(Operand const &value, StreamEndStop) -> Operand const & {
    return value;
}
}  // namespace Catch

#define CATCH_INTERNAL_LINEINFO \
    ::Catch::SourceLineInfo(__FILE__, static_cast<std::size_t>(__LINE__))

// end catch_common.h
namespace Catch {

// Registrar whose constructor receives a tag alias, the tag text it stands
// for, and the source location of the registration. The constructor is only
// declared here; what it does with the arguments is defined elsewhere.
struct RegistrarForTagAliases {
    RegistrarForTagAliases(char const *alias, char const *tag, SourceLineInfo const &lineInfo);
};

}  // end namespace Catch

// Defines, inside an anonymous namespace, a uniquely named
// Catch::RegistrarForTagAliases object constructed from (alias, spec) and the
// current source location. The definition is bracketed by the
// warning-suppression macros, with global-object warnings silenced.
#define CATCH_REGISTER_TAG_ALIAS(alias, spec)                            \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                            \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                             \
    namespace {                                                          \
    Catch::RegistrarForTagAliases INTERNAL_CATCH_UNIQUE_NAME(            \
            AutoRegisterTagAlias)(alias, spec, CATCH_INTERNAL_LINEINFO); \
    }                                                                    \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION

// end catch_tag_alias_autoregistrar.h
// start catch_test_registry.h

// start catch_interfaces_testcase.h

#include <vector>

namespace Catch {

class TestSpec;

// Interface with a single pure-virtual, const invoke().
// NOTE(review): presumably each registered test body is wrapped in an
// implementation of this interface -- confirm against makeTestInvoker.
struct ITestInvoker {
    virtual void invoke() const = 0;
    virtual ~ITestInvoker();
};

class TestCase;
struct IConfig;

// Read-only view of the registered test cases: all of them, or all of them
// "sorted" for a given configuration. Both accessors return references to
// vectors owned by the implementation.
struct ITestCaseRegistry {
    virtual ~ITestCaseRegistry();
    virtual std::vector<TestCase> const &getAllTests() const = 0;
    virtual std::vector<TestCase> const &getAllTestsSorted(IConfig const &config) const = 0;
};

// Free helpers over test cases; declared here, defined elsewhere in the file.
bool isThrowSafe(TestCase const &testCase, IConfig const &config);
bool matchTest(TestCase const &testCase, TestSpec const &testSpec, IConfig const &config);
// Returns a new vector (by value) built from testCases, testSpec and config.
std::vector<TestCase> filterTests(std::vector<TestCase> const &testCases,
                                  TestSpec const &testSpec,
                                  IConfig const &config);
std::vector<TestCase> const &getAllTestCasesSorted(IConfig const &config);

}  // namespace Catch

// end catch_interfaces_testcase.h
// start catch_stringref.h

#include <cassert>
#include <cstddef>
#include <iosfwd>
#include <string>

namespace Catch {

/// A non-owning string class (similar to std::string_view, which is only
/// available from C++17 onwards).
/// Note that, because a StringRef may be a substring of another string,
/// it may not be null terminated.
class StringRef {
public:
    using size_type = std::size_t;
    using const_iterator = const char *;

private:
    // Target of a default-constructed StringRef, so m_start is never null
    // for the default state.
    static constexpr char const *const s_empty = "";

    char const *m_start = s_empty;
    size_type m_size = 0;

public:  // construction
    // Empty view pointing at s_empty.
    constexpr StringRef() noexcept = default;

    // View over a C string; defined elsewhere in the file.
    StringRef(char const *rawChars) noexcept;

    // View over exactly `size` characters starting at `rawChars`.
    constexpr StringRef(char const *rawChars, size_type size) noexcept
            : m_start(rawChars), m_size(size) {}

    // View over the contents of a std::string; the string must outlive it.
    StringRef(std::string const &stdString) noexcept
            : m_start(stdString.c_str()), m_size(stdString.size()) {}

    // Copies the viewed characters into an owning std::string.
    explicit operator std::string() const { return std::string(m_start, m_size); }

public:  // operators
    auto operator==(StringRef const &other) const noexcept -> bool;
    auto operator!=(StringRef const &other) const noexcept -> bool { return !(*this == other); }

    // Unchecked in release builds; the index is only validated by assert.
    auto operator[](size_type index) const noexcept -> char {
        assert(index < m_size);
        return m_start[index];
    }

public:  // named queries
    constexpr auto empty() const noexcept -> bool { return m_size == 0; }
    constexpr auto size() const noexcept -> size_type { return m_size; }

    // Returns the current start pointer. If the StringRef is not
    // null-terminated, an exception is thrown.
    // NOTE(review): this comment used to name `std::domain_exception`, which
    // is not a standard type; presumably std::domain_error is meant --
    // confirm against the out-of-line definition.
    auto c_str() const -> char const *;

public:  // substrings and searches
    // Returns a substring of [start, start + length).
    // If start + length > size(), then the substring is [start, size()).
    // If start > size(), then the substring is empty.
    auto substr(size_type start, size_type length) const noexcept -> StringRef;

    // Returns the current start pointer. May not be null-terminated.
    auto data() const noexcept -> char const *;

    // Reads the character one past the viewed range, so the underlying
    // buffer must be readable at m_start[m_size].
    constexpr auto isNullTerminated() const noexcept -> bool { return m_start[m_size] == '\0'; }

public:  // iterators
    constexpr const_iterator begin() const { return m_start; }
    constexpr const_iterator end() const { return m_start + m_size; }
};

auto operator+=(std::string &lhs, StringRef const &sr) -> std::string &;
auto operator<<(std::ostream &os, StringRef const &sr) -> std::ostream &;

// "text"_sr builds a StringRef over a string literal without a strlen call.
// Written without whitespace between "" and the suffix: the spaced form is
// deprecated and turns the suffix into an ordinary (reservable) identifier.
constexpr auto operator""_sr(char const *rawChars, std::size_t size) noexcept -> StringRef {
    return StringRef(rawChars, size);
}
}  // namespace Catch

// Global-namespace counterpart of Catch::operator""_sr, usable without a
// using-directive.
constexpr auto operator""_catch_sr(char const *rawChars, std::size_t size) noexcept
        -> Catch::StringRef {
    return Catch::StringRef(rawChars, size);
}

// end catch_stringref.h
// start catch_preprocessor.hpp

// Forced re-scanning helpers. LEVEL0 is the identity; every higher level
// nests three invocations of the level below it around its arguments, which
// makes the preprocessor rescan the argument text repeatedly.
#define CATCH_RECURSION_LEVEL0(...) __VA_ARGS__
#define CATCH_RECURSION_LEVEL1(...) \
    CATCH_RECURSION_LEVEL0(CATCH_RECURSION_LEVEL0(CATCH_RECURSION_LEVEL0(__VA_ARGS__)))
#define CATCH_RECURSION_LEVEL2(...) \
    CATCH_RECURSION_LEVEL1(CATCH_RECURSION_LEVEL1(CATCH_RECURSION_LEVEL1(__VA_ARGS__)))
#define CATCH_RECURSION_LEVEL3(...) \
    CATCH_RECURSION_LEVEL2(CATCH_RECURSION_LEVEL2(CATCH_RECURSION_LEVEL2(__VA_ARGS__)))
#define CATCH_RECURSION_LEVEL4(...) \
    CATCH_RECURSION_LEVEL3(CATCH_RECURSION_LEVEL3(CATCH_RECURSION_LEVEL3(__VA_ARGS__)))
#define CATCH_RECURSION_LEVEL5(...) \
    CATCH_RECURSION_LEVEL4(CATCH_RECURSION_LEVEL4(CATCH_RECURSION_LEVEL4(__VA_ARGS__)))

// CATCH_RECURSE is the entry point: level 5 normally, and two nested level-6
// passes when the traditional MSVC preprocessor is in use. That branch also
// provides INTERNAL_CATCH_EXPAND_VARGS, an identity macro.
#ifdef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_EXPAND_VARGS(...) __VA_ARGS__
// MSVC needs more evaluations
#define CATCH_RECURSION_LEVEL6(...) \
    CATCH_RECURSION_LEVEL5(CATCH_RECURSION_LEVEL5(CATCH_RECURSION_LEVEL5(__VA_ARGS__)))
#define CATCH_RECURSE(...) CATCH_RECURSION_LEVEL6(CATCH_RECURSION_LEVEL6(__VA_ARGS__))
#else
#define CATCH_RECURSE(...) CATCH_RECURSION_LEVEL5(__VA_ARGS__)
#endif

// Building blocks for macro "recursion" over an argument list.
// CATCH_REC_END swallows its arguments and CATCH_REC_OUT expands to nothing.
#define CATCH_REC_END(...)
#define CATCH_REC_OUT

// CATCH_DEFER(id) emits `id` followed by an empty expansion, so that `id` is
// not invoked as a function-like macro until a later rescan.
#define CATCH_EMPTY()
#define CATCH_DEFER(id) id CATCH_EMPTY()

// End-of-list detection. CATCH_REC_NEXT(test, next) places `test` directly
// after CATCH_REC_GET_END; when `test` is the `()()()` terminator supplied by
// CATCH_REC_LIST / CATCH_REC_LIST_UD the chain GET_END -> GET_END1 ->
// GET_END2 fires and yields `0, CATCH_REC_END`, which makes CATCH_REC_NEXT0
// select CATCH_REC_END instead of `next`.
#define CATCH_REC_GET_END2() 0, CATCH_REC_END
#define CATCH_REC_GET_END1(...) CATCH_REC_GET_END2
#define CATCH_REC_GET_END(...) CATCH_REC_GET_END1
#define CATCH_REC_NEXT0(test, next, ...) next CATCH_REC_OUT
#define CATCH_REC_NEXT1(test, next) CATCH_DEFER(CATCH_REC_NEXT0)(test, next, 0)
#define CATCH_REC_NEXT(test, next) CATCH_REC_NEXT1(CATCH_REC_GET_END test, next)

// LIST0 and LIST1 call each other alternately and each emit `, f(x)`;
// LIST2 is the first step and emits `f(x)` without the leading comma.
#define CATCH_REC_LIST0(f, x, peek, ...) \
    , f(x) CATCH_DEFER(CATCH_REC_NEXT(peek, CATCH_REC_LIST1))(f, peek, __VA_ARGS__)
#define CATCH_REC_LIST1(f, x, peek, ...) \
    , f(x) CATCH_DEFER(CATCH_REC_NEXT(peek, CATCH_REC_LIST0))(f, peek, __VA_ARGS__)
#define CATCH_REC_LIST2(f, x, peek, ...) \
    f(x) CATCH_DEFER(CATCH_REC_NEXT(peek, CATCH_REC_LIST1))(f, peek, __VA_ARGS__)

// Same three steps, with an extra `userdata` argument forwarded to every
// f(userdata, x) call.
#define CATCH_REC_LIST0_UD(f, userdata, x, peek, ...)                                         \
    , f(userdata, x) CATCH_DEFER(CATCH_REC_NEXT(peek, CATCH_REC_LIST1_UD))(f, userdata, peek, \
                                                                           __VA_ARGS__)
#define CATCH_REC_LIST1_UD(f, userdata, x, peek, ...)                                         \
    , f(userdata, x) CATCH_DEFER(CATCH_REC_NEXT(peek, CATCH_REC_LIST0_UD))(f, userdata, peek, \
                                                                           __VA_ARGS__)
#define CATCH_REC_LIST2_UD(f, userdata, x, peek, ...) \
    f(userdata, x)                                    \
            CATCH_DEFER(CATCH_REC_NEXT(peek, CATCH_REC_LIST1_UD))(f, userdata, peek, __VA_ARGS__)

// Applies the function macro `f` to each of the remaining parameters, inserts
// commas between the results, and passes userdata as the first parameter to
// each invocation, e.g. CATCH_REC_LIST_UD(f, x, a, b, c) evaluates to f(x, a),
// f(x, b), f(x, c)
#define CATCH_REC_LIST_UD(f, userdata, ...) \
    CATCH_RECURSE(CATCH_REC_LIST2_UD(f, userdata, __VA_ARGS__, ()()(), ()()(), ()()(), 0))

// Same as CATCH_REC_LIST_UD but without userdata: applies `f` to every
// argument, separating the results with commas.
#define CATCH_REC_LIST(f, ...) \
    CATCH_RECURSE(CATCH_REC_LIST2(f, __VA_ARGS__, ()()(), ()()(), ()()(), 0))

// Optional-parenthesis stripping, used by INTERNAL_CATCH_REMOVE_PARENS below.
// The argument is prefixed with INTERNAL_CATCH_DEF: if it is parenthesised,
// that invokes the function-like macro INTERNAL_CATCH_DEF, which re-emits the
// contents without the parentheses; otherwise the name is left as a plain
// token. EXPAND2 then pastes INTERNAL_CATCH_NO in front, producing
// INTERNAL_CATCH_NOINTERNAL_CATCH_DEF, which expands to nothing.
#define INTERNAL_CATCH_EXPAND1(param) INTERNAL_CATCH_EXPAND2(param)
#define INTERNAL_CATCH_EXPAND2(...) INTERNAL_CATCH_NO##__VA_ARGS__
#define INTERNAL_CATCH_DEF(...) INTERNAL_CATCH_DEF __VA_ARGS__
#define INTERNAL_CATCH_NOINTERNAL_CATCH_DEF
// Stringification with one level of indirection so that arguments are
// macro-expanded before `#` is applied.
#define INTERNAL_CATCH_STRINGIZE(...) INTERNAL_CATCH_STRINGIZE2(__VA_ARGS__)
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_STRINGIZE2(...) #__VA_ARGS__
#define INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS(param) \
    INTERNAL_CATCH_STRINGIZE(INTERNAL_CATCH_REMOVE_PARENS(param))
#else
// MSVC is adding extra space and needs another indirection to expand
// INTERNAL_CATCH_NOINTERNAL_CATCH_DEF
// The `+ 1` below advances the string pointer past its first character.
#define INTERNAL_CATCH_STRINGIZE2(...) INTERNAL_CATCH_STRINGIZE3(__VA_ARGS__)
#define INTERNAL_CATCH_STRINGIZE3(...) #__VA_ARGS__
#define INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS(param) \
    (INTERNAL_CATCH_STRINGIZE(INTERNAL_CATCH_REMOVE_PARENS(param)) + 1)
#endif

// Builds the identifier ns_<name>; the extra level lets `name` be expanded
// before pasting.
#define INTERNAL_CATCH_MAKE_NAMESPACE2(...) ns_##__VA_ARGS__
#define INTERNAL_CATCH_MAKE_NAMESPACE(name) INTERNAL_CATCH_MAKE_NAMESPACE2(name)

// Expands to its argument with one surrounding pair of parentheses removed
// if present, or to the argument unchanged if it is not parenthesised.
#define INTERNAL_CATCH_REMOVE_PARENS(...) INTERNAL_CATCH_EXPAND1(INTERNAL_CATCH_DEF __VA_ARGS__)

// INTERNAL_CATCH_MAKE_TYPE_LIST(...) strips optional parentheses from its
// argument and expands to the type of get_wrapper<...>() applied to the
// result. INTERNAL_CATCH_REMOVE_PARENS_GEN is defined outside this part of
// the file. The traditional-MSVC branch is the same expansion wrapped in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_MAKE_TYPE_LIST2(...) \
    decltype(get_wrapper<INTERNAL_CATCH_REMOVE_PARENS_GEN(__VA_ARGS__)>())
#define INTERNAL_CATCH_MAKE_TYPE_LIST(...) \
    INTERNAL_CATCH_MAKE_TYPE_LIST2(INTERNAL_CATCH_REMOVE_PARENS(__VA_ARGS__))
#else
#define INTERNAL_CATCH_MAKE_TYPE_LIST2(...) \
    INTERNAL_CATCH_EXPAND_VARGS(            \
            decltype(get_wrapper<INTERNAL_CATCH_REMOVE_PARENS_GEN(__VA_ARGS__)>()))
#define INTERNAL_CATCH_MAKE_TYPE_LIST(...) \
    INTERNAL_CATCH_EXPAND_VARGS(           \
            INTERNAL_CATCH_MAKE_TYPE_LIST2(INTERNAL_CATCH_REMOVE_PARENS(__VA_ARGS__)))
#endif

// Applies INTERNAL_CATCH_MAKE_TYPE_LIST to every argument, comma-separated.
#define INTERNAL_CATCH_MAKE_TYPE_LISTS_FROM_TYPES(...) \
    CATCH_REC_LIST(INTERNAL_CATCH_MAKE_TYPE_LIST, __VA_ARGS__)

// Fixed-arity helpers (1 to 11 arguments). Each applies
// INTERNAL_CATCH_REMOVE_PARENS to its first argument and delegates the rest
// to the next-lower arity, joining the pieces with commas.
#define INTERNAL_CATCH_REMOVE_PARENS_1_ARG(a0) INTERNAL_CATCH_REMOVE_PARENS(a0)
#define INTERNAL_CATCH_REMOVE_PARENS_2_ARG(a0, a1) \
    INTERNAL_CATCH_REMOVE_PARENS(a0), INTERNAL_CATCH_REMOVE_PARENS_1_ARG(a1)
#define INTERNAL_CATCH_REMOVE_PARENS_3_ARG(a0, a1, a2) \
    INTERNAL_CATCH_REMOVE_PARENS(a0), INTERNAL_CATCH_REMOVE_PARENS_2_ARG(a1, a2)
#define INTERNAL_CATCH_REMOVE_PARENS_4_ARG(a0, a1, a2, a3) \
    INTERNAL_CATCH_REMOVE_PARENS(a0), INTERNAL_CATCH_REMOVE_PARENS_3_ARG(a1, a2, a3)
#define INTERNAL_CATCH_REMOVE_PARENS_5_ARG(a0, a1, a2, a3, a4) \
    INTERNAL_CATCH_REMOVE_PARENS(a0), INTERNAL_CATCH_REMOVE_PARENS_4_ARG(a1, a2, a3, a4)
#define INTERNAL_CATCH_REMOVE_PARENS_6_ARG(a0, a1, a2, a3, a4, a5) \
    INTERNAL_CATCH_REMOVE_PARENS(a0), INTERNAL_CATCH_REMOVE_PARENS_5_ARG(a1, a2, a3, a4, a5)
#define INTERNAL_CATCH_REMOVE_PARENS_7_ARG(a0, a1, a2, a3, a4, a5, a6) \
    INTERNAL_CATCH_REMOVE_PARENS(a0), INTERNAL_CATCH_REMOVE_PARENS_6_ARG(a1, a2, a3, a4, a5, a6)
#define INTERNAL_CATCH_REMOVE_PARENS_8_ARG(a0, a1, a2, a3, a4, a5, a6, a7) \
    INTERNAL_CATCH_REMOVE_PARENS(a0), INTERNAL_CATCH_REMOVE_PARENS_7_ARG(a1, a2, a3, a4, a5, a6, a7)
#define INTERNAL_CATCH_REMOVE_PARENS_9_ARG(a0, a1, a2, a3, a4, a5, a6, a7, a8) \
    INTERNAL_CATCH_REMOVE_PARENS(a0),                                          \
            INTERNAL_CATCH_REMOVE_PARENS_8_ARG(a1, a2, a3, a4, a5, a6, a7, a8)
#define INTERNAL_CATCH_REMOVE_PARENS_10_ARG(a0, a1, a2, a3, a4, a5, a6, a7, a8, a9) \
    INTERNAL_CATCH_REMOVE_PARENS(a0),                                               \
            INTERNAL_CATCH_REMOVE_PARENS_9_ARG(a1, a2, a3, a4, a5, a6, a7, a8, a9)
#define INTERNAL_CATCH_REMOVE_PARENS_11_ARG(a0, a1, a2, a3, a4, a5, a6, a7, a8, a9, a10) \
    INTERNAL_CATCH_REMOVE_PARENS(a0),                                                    \
            INTERNAL_CATCH_REMOVE_PARENS_10_ARG(a1, a2, a3, a4, a5, a6, a7, a8, a9, a10)

// Argument selector: expands to its twelfth argument and drops the rest.
#define INTERNAL_CATCH_VA_NARGS_IMPL(a0, a1, a2, a3, a4, a5, a6, a7, a8, a9, a10, Selected, ...) \
    Selected

// Expands to the type-list metaprogramming toolkit used by the templated
// test-case macros:
//   - TypeList<Ts...> / TemplateTypeList<Cs...>: empty tag templates, each
//     with a get_wrapper<...>() overload returning a value of the tag type.
//   - append<...>: concatenates the element packs of successive list types
//     into the first list's template; a TypeList<mpl_::na> in second position
//     ends the chain and yields the first list as-is.
//   - rewrap<TemplateTypeList<Container>, Lists...>: produces a TypeList of
//     Container<elems...> for each supplied list.
//   - create<Final, TemplateTypeList<Containers...>, TypeList<Types...>>:
//     appends the rewrap result of every container onto Final<>.
//   - convert<Final, List<Ts...>>: re-homes the elements of List into Final.
// mpl_::na is referenced but not declared by this macro; it has to be visible
// wherever the macro is expanded.
#define INTERNAL_CATCH_TYPE_GEN                                                                 \
    template <typename...>                                                                      \
    struct TypeList {};                                                                         \
    template <typename... Ts>                                                                   \
    constexpr auto get_wrapper() noexcept->TypeList<Ts...> {                                    \
        return {};                                                                              \
    }                                                                                           \
    template <template <typename...> class...>                                                  \
    struct TemplateTypeList {};                                                                 \
    template <template <typename...> class... Cs>                                               \
    constexpr auto get_wrapper() noexcept->TemplateTypeList<Cs...> {                            \
        return {};                                                                              \
    }                                                                                           \
    template <typename...>                                                                      \
    struct append;                                                                              \
    template <typename...>                                                                      \
    struct rewrap;                                                                              \
    template <template <typename...> class, typename...>                                        \
    struct create;                                                                              \
    template <template <typename...> class, typename>                                           \
    struct convert;                                                                             \
                                                                                                \
    template <typename T>                                                                       \
    struct append<T> {                                                                          \
        using type = T;                                                                         \
    };                                                                                          \
    template <template <typename...> class L1, typename... E1, template <typename...> class L2, \
              typename... E2, typename... Rest>                                                 \
    struct append<L1<E1...>, L2<E2...>, Rest...> {                                              \
        using type = typename append<L1<E1..., E2...>, Rest...>::type;                          \
    };                                                                                          \
    template <template <typename...> class L1, typename... E1, typename... Rest>                \
    struct append<L1<E1...>, TypeList<mpl_::na>, Rest...> {                                     \
        using type = L1<E1...>;                                                                 \
    };                                                                                          \
                                                                                                \
    template <template <typename...> class Container, template <typename...> class List,        \
              typename... elems>                                                                \
    struct rewrap<TemplateTypeList<Container>, List<elems...>> {                                \
        using type = TypeList<Container<elems...>>;                                             \
    };                                                                                          \
    template <template <typename...> class Container, template <typename...> class List,        \
              class... Elems, typename... Elements>                                             \
    struct rewrap<TemplateTypeList<Container>, List<Elems...>, Elements...> {                   \
        using type = typename append<                                                           \
                TypeList<Container<Elems...>>,                                                  \
                typename rewrap<TemplateTypeList<Container>, Elements...>::type>::type;         \
    };                                                                                          \
                                                                                                \
    template <template <typename...> class Final, template <typename...> class... Containers,   \
              typename... Types>                                                                \
    struct create<Final, TemplateTypeList<Containers...>, TypeList<Types...>> {                 \
        using type = typename append<                                                           \
                Final<>,                                                                        \
                typename rewrap<TemplateTypeList<Containers>, Types...>::type...>::type;        \
    };                                                                                          \
    template <template <typename...> class Final, template <typename...> class List,            \
              typename... Ts>                                                                   \
    struct convert<Final, List<Ts...>> {                                                        \
        using type = typename append<Final<>, TypeList<Ts>...>::type;                           \
    };

// Counterpart of INTERNAL_CATCH_TYPE_GEN for templates with a custom
// parameter signature (e.g. non-type template parameters).
//   signature   - the template parameter list, optionally parenthesised.
//   __VA_ARGS__ - the parameter names from that list, used as arguments.
// Expands to the Nttp<...> and NttpTemplateTypeList<...> tag templates with
// their get_wrapper overloads, plus rewrap/create specialisations for
// NttpTemplateTypeList. It specialises rewrap, create and append and uses
// TypeList, so those must already be declared where it is expanded.
#define INTERNAL_CATCH_NTTP_1(signature, ...)                                                \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>                                       \
    struct Nttp {};                                                                          \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>                                       \
    constexpr auto get_wrapper() noexcept->Nttp<__VA_ARGS__> {                               \
        return {};                                                                           \
    }                                                                                        \
    template <template <INTERNAL_CATCH_REMOVE_PARENS(signature)> class...>                   \
    struct NttpTemplateTypeList {};                                                          \
    template <template <INTERNAL_CATCH_REMOVE_PARENS(signature)> class... Cs>                \
    constexpr auto get_wrapper() noexcept->NttpTemplateTypeList<Cs...> {                     \
        return {};                                                                           \
    }                                                                                        \
                                                                                             \
    template <template <INTERNAL_CATCH_REMOVE_PARENS(signature)> class Container,            \
              template <INTERNAL_CATCH_REMOVE_PARENS(signature)> class List,                 \
              INTERNAL_CATCH_REMOVE_PARENS(signature)>                                       \
    struct rewrap<NttpTemplateTypeList<Container>, List<__VA_ARGS__>> {                      \
        using type = TypeList<Container<__VA_ARGS__>>;                                       \
    };                                                                                       \
    template <template <INTERNAL_CATCH_REMOVE_PARENS(signature)> class Container,            \
              template <INTERNAL_CATCH_REMOVE_PARENS(signature)> class List,                 \
              INTERNAL_CATCH_REMOVE_PARENS(signature), typename... Elements>                 \
    struct rewrap<NttpTemplateTypeList<Container>, List<__VA_ARGS__>, Elements...> {         \
        using type = typename append<                                                        \
                TypeList<Container<__VA_ARGS__>>,                                            \
                typename rewrap<NttpTemplateTypeList<Container>, Elements...>::type>::type;  \
    };                                                                                       \
    template <template <typename...> class Final,                                            \
              template <INTERNAL_CATCH_REMOVE_PARENS(signature)> class... Containers,        \
              typename... Types>                                                             \
    struct create<Final, NttpTemplateTypeList<Containers...>, TypeList<Types...>> {          \
        using type = typename append<                                                        \
                Final<>,                                                                     \
                typename rewrap<NttpTemplateTypeList<Containers>, Types...>::type...>::type; \
    };

// Declaration heads for signature-based template tests.
// The ...0 form expands to nothing; the ...1 and ..._X forms both expand to
// `template <signature> static void TestName()` (with optional parentheses
// around the signature removed). ..._X accepts and ignores extra arguments.
#define INTERNAL_CATCH_DECLARE_SIG_TEST0(TestName)
#define INTERNAL_CATCH_DECLARE_SIG_TEST1(TestName, signature) \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>        \
    static void TestName()
#define INTERNAL_CATCH_DECLARE_SIG_TEST_X(TestName, signature, ...) \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>              \
    static void TestName()

// Definition heads; the expansions are token-for-token the same as the
// DECLARE variants above. No trailing `;` or body is emitted.
#define INTERNAL_CATCH_DEFINE_SIG_TEST0(TestName)
#define INTERNAL_CATCH_DEFINE_SIG_TEST1(TestName, signature) \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>       \
    static void TestName()
#define INTERNAL_CATCH_DEFINE_SIG_TEST_X(TestName, signature, ...) \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>             \
    static void TestName()

// Generators for `reg_test` overloads. Each overload is selected by a tag
// argument (TypeList<Type> or Nttp<...>) and constructs a Catch::AutoReg from
// a test invoker, the source location, a class name and the name/tags pair.

// Free-function test, plain type parameter; the class name is an empty
// StringRef. `signature` is accepted but unused.
#define INTERNAL_CATCH_NTTP_REGISTER0(TestFunc, signature)                               \
    template <typename Type>                                                             \
    void reg_test(TypeList<Type>, Catch::NameAndTags nameAndTags) {                      \
        Catch::AutoReg(Catch::makeTestInvoker(&TestFunc<Type>), CATCH_INTERNAL_LINEINFO, \
                       Catch::StringRef(), nameAndTags);                                 \
    }

// Free-function test with a custom template signature; __VA_ARGS__ are the
// template arguments forwarded to TestFunc.
#define INTERNAL_CATCH_NTTP_REGISTER(TestFunc, signature, ...)                                  \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>                                          \
    void reg_test(Nttp<__VA_ARGS__>, Catch::NameAndTags nameAndTags) {                          \
        Catch::AutoReg(Catch::makeTestInvoker(&TestFunc<__VA_ARGS__>), CATCH_INTERNAL_LINEINFO, \
                       Catch::StringRef(), nameAndTags);                                        \
    }

// Method test, plain type parameter: registers TestName<Type>::test and
// forwards the caller-supplied class name. `signature` and any further
// arguments are accepted but unused.
#define INTERNAL_CATCH_NTTP_REGISTER_METHOD0(TestName, signature, ...)                          \
    template <typename Type>                                                                    \
    void reg_test(TypeList<Type>, Catch::StringRef className, Catch::NameAndTags nameAndTags) { \
        Catch::AutoReg(Catch::makeTestInvoker(&TestName<Type>::test), CATCH_INTERNAL_LINEINFO,  \
                       className, nameAndTags);                                                 \
    }

// Method test with a custom template signature: registers
// TestName<__VA_ARGS__>::test.
#define INTERNAL_CATCH_NTTP_REGISTER_METHOD(TestName, signature, ...)                              \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>                                             \
    void reg_test(Nttp<__VA_ARGS__>, Catch::StringRef className, Catch::NameAndTags nameAndTags) { \
        Catch::AutoReg(Catch::makeTestInvoker(&TestName<__VA_ARGS__>::test),                       \
                       CATCH_INTERNAL_LINEINFO, className, nameAndTags);                           \
    }

#define INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD0(TestName, ClassName)
#define INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD1(TestName, ClassName, signature) \
    template <typename TestType>                                                \
    struct TestName : INTERNAL_CATCH_REMOVE_PARENS(ClassName)<TestType> {       \
        void test();                                                            \
    }

// Explicit-signature declaration helper: declares `struct TestName`, templated on
// `signature`, deriving from `ClassName<__VA_ARGS__>` with a single `void test();`
// member. The expansion has no trailing semicolon; the user of the macro
// supplies it.
#define INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X(TestName, ClassName, signature, ...) \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>                                \
    struct TestName : INTERNAL_CATCH_REMOVE_PARENS(ClassName)<__VA_ARGS__> {          \
        void test();                                                                  \
    }

// Definition helpers for templated fixture tests. Each non-empty variant expands
// to the out-of-line header of `TestName<...>::test()`, qualified with the
// namespace produced by INTERNAL_CATCH_MAKE_NAMESPACE(TestName). The function
// body is whatever follows the macro invocation.
//  - METHOD0 expands to nothing.
//  - METHOD1 uses the fixed parameter list `typename TestType` and ignores
//    `signature`.
//  - METHOD_X uses `signature` as the template parameter list and
//    `__VA_ARGS__` as the template arguments.
#define INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD0(TestName)
#define INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD1(TestName, signature) \
    template <typename TestType>                                    \
    void INTERNAL_CATCH_MAKE_NAMESPACE(TestName)::TestName<TestType>::test()
#define INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X(TestName, signature, ...) \
    template <INTERNAL_CATCH_REMOVE_PARENS(signature)>                    \
    void INTERNAL_CATCH_MAKE_NAMESPACE(TestName)::TestName<__VA_ARGS__>::test()

#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
// Conforming-preprocessor branch.
// INTERNAL_CATCH_NTTP_0 is object-like here and expands to nothing.
// INTERNAL_CATCH_NTTP_GEN forwards the signature plus a candidate list (ten
// already-applied INTERNAL_CATCH_NTTP_1(__VA_ARGS__) entries followed by
// INTERNAL_CATCH_NTTP_0) to INTERNAL_CATCH_VA_NARGS_IMPL.
// NOTE(review): INTERNAL_CATCH_VA_NARGS_IMPL is defined elsewhere; presumably it
// yields the argument at a fixed position, so the number of signature elements
// decides which candidate survives - confirm against its definition.
#define INTERNAL_CATCH_NTTP_0
#define INTERNAL_CATCH_NTTP_GEN(...)                                                             \
    INTERNAL_CATCH_VA_NARGS_IMPL(                                                                \
            __VA_ARGS__, INTERNAL_CATCH_NTTP_1(__VA_ARGS__), INTERNAL_CATCH_NTTP_1(__VA_ARGS__), \
            INTERNAL_CATCH_NTTP_1(__VA_ARGS__), INTERNAL_CATCH_NTTP_1(__VA_ARGS__),              \
            INTERNAL_CATCH_NTTP_1(__VA_ARGS__), INTERNAL_CATCH_NTTP_1(__VA_ARGS__),              \
            INTERNAL_CATCH_NTTP_1(__VA_ARGS__), INTERNAL_CATCH_NTTP_1(__VA_ARGS__),              \
            INTERNAL_CATCH_NTTP_1(__VA_ARGS__), INTERNAL_CATCH_NTTP_1(__VA_ARGS__),              \
            INTERNAL_CATCH_NTTP_0)
// Arity dispatchers for fixture-based templated tests (conforming preprocessor).
// Each passes "dummy", the signature elements and a candidate list (nine `_X`
// helpers, then the `1` helper, then the `0` helper) to
// INTERNAL_CATCH_VA_NARGS_IMPL, and applies the selected helper to the original
// arguments.
// NOTE(review): the selection rule lives in INTERNAL_CATCH_VA_NARGS_IMPL, which
// is defined elsewhere; presumably multi-element signatures pick `_X` and a
// single-element signature picks `1` - confirm against its definition.
#define INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD(TestName, ...)                                  \
    INTERNAL_CATCH_VA_NARGS_IMPL(                                                             \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X,                    \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD1, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD0)   \
    (TestName, __VA_ARGS__)
#define INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD(TestName, ClassName, ...)                        \
    INTERNAL_CATCH_VA_NARGS_IMPL(                                                               \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X,                     \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD1, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD0)   \
    (TestName, ClassName, __VA_ARGS__)
// Arity dispatchers that generate the `reg_test` registrar overloads (conforming
// preprocessor). The candidate lists hold nine signature-based registrars
// followed by two copies of the type-only registrar (`..._METHOD0` /
// `...REGISTER0`); the selected helper is applied to the original arguments.
// NOTE(review): the selection rule lives in INTERNAL_CATCH_VA_NARGS_IMPL, which
// is defined elsewhere - confirm which arity maps to which slot.
#define INTERNAL_CATCH_NTTP_REG_METHOD_GEN(TestName, ...)                               \
    INTERNAL_CATCH_VA_NARGS_IMPL(                                                       \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_NTTP_REGISTER_METHOD,                  \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD,   \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD,   \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD,   \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD,   \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD0, INTERNAL_CATCH_NTTP_REGISTER_METHOD0) \
    (TestName, __VA_ARGS__)
#define INTERNAL_CATCH_NTTP_REG_GEN(TestFunc, ...)                                             \
    INTERNAL_CATCH_VA_NARGS_IMPL("dummy", __VA_ARGS__, INTERNAL_CATCH_NTTP_REGISTER,           \
                                 INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER,   \
                                 INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER,   \
                                 INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER,   \
                                 INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER,   \
                                 INTERNAL_CATCH_NTTP_REGISTER0, INTERNAL_CATCH_NTTP_REGISTER0) \
    (TestFunc, __VA_ARGS__)
// Arity dispatcher for the definition header of a free templated test function
// (conforming preprocessor). Candidates: nine INTERNAL_CATCH_DEFINE_SIG_TEST_X,
// then INTERNAL_CATCH_DEFINE_SIG_TEST1, then INTERNAL_CATCH_DEFINE_SIG_TEST0.
// The selected helper is applied to (TestName, signature...).
#define INTERNAL_CATCH_DEFINE_SIG_TEST(TestName, ...)                           \
    INTERNAL_CATCH_VA_NARGS_IMPL(                                               \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DEFINE_SIG_TEST_X,             \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST1, INTERNAL_CATCH_DEFINE_SIG_TEST0)   \
    (TestName, __VA_ARGS__)
// Arity dispatcher for the forward declaration of a free templated test function
// (conforming preprocessor). Candidates: nine INTERNAL_CATCH_DECLARE_SIG_TEST_X,
// then INTERNAL_CATCH_DECLARE_SIG_TEST1, then INTERNAL_CATCH_DECLARE_SIG_TEST0.
// The selected helper is applied to (TestName, signature...).
// Every multi-element slot must name the DECLARE helper, so that the declaration
// produced here never depends on how the DEFINE helper happens to be written.
#define INTERNAL_CATCH_DECLARE_SIG_TEST(TestName, ...)                            \
    INTERNAL_CATCH_VA_NARGS_IMPL(                                                 \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DECLARE_SIG_TEST_X,              \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST1, INTERNAL_CATCH_DECLARE_SIG_TEST0)   \
    (TestName, __VA_ARGS__)
// Arity dispatcher (conforming preprocessor): selects one of
// INTERNAL_CATCH_REMOVE_PARENS_11_ARG ... INTERNAL_CATCH_REMOVE_PARENS_1_ARG via
// INTERNAL_CATCH_VA_NARGS_IMPL and applies it to the same argument list.
// The candidates are listed from the largest arity down to the smallest.
#define INTERNAL_CATCH_REMOVE_PARENS_GEN(...)                                                      \
    INTERNAL_CATCH_VA_NARGS_IMPL(                                                                  \
            __VA_ARGS__, INTERNAL_CATCH_REMOVE_PARENS_11_ARG, INTERNAL_CATCH_REMOVE_PARENS_10_ARG, \
            INTERNAL_CATCH_REMOVE_PARENS_9_ARG, INTERNAL_CATCH_REMOVE_PARENS_8_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_7_ARG, INTERNAL_CATCH_REMOVE_PARENS_6_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_5_ARG, INTERNAL_CATCH_REMOVE_PARENS_4_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_3_ARG, INTERNAL_CATCH_REMOVE_PARENS_2_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_1_ARG)                                                    \
    (__VA_ARGS__)
#else
// Traditional-MSVC-preprocessor branch.
// INTERNAL_CATCH_NTTP_0 is function-like here (it swallows `signature` and
// expands to nothing), because in this branch the selected candidate is applied
// to (__VA_ARGS__) after selection rather than before.
// The whole expression is wrapped in INTERNAL_CATCH_EXPAND_VARGS.
// NOTE(review): presumably that wrapper forces the rescan the traditional MSVC
// preprocessor needs to split __VA_ARGS__ - confirm against its definition.
#define INTERNAL_CATCH_NTTP_0(signature)
#define INTERNAL_CATCH_NTTP_GEN(...)                                                          \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                                 \
            __VA_ARGS__, INTERNAL_CATCH_NTTP_1, INTERNAL_CATCH_NTTP_1, INTERNAL_CATCH_NTTP_1, \
            INTERNAL_CATCH_NTTP_1, INTERNAL_CATCH_NTTP_1, INTERNAL_CATCH_NTTP_1,              \
            INTERNAL_CATCH_NTTP_1, INTERNAL_CATCH_NTTP_1, INTERNAL_CATCH_NTTP_1,              \
            INTERNAL_CATCH_NTTP_1, INTERNAL_CATCH_NTTP_0)(__VA_ARGS__))
// Arity dispatchers for fixture-based templated tests (traditional MSVC
// preprocessor). Same candidate lists as the conforming branch: nine `_X`
// helpers, then the `1` helper, then the `0` helper. The selection and the
// application to the original arguments are wrapped in
// INTERNAL_CATCH_EXPAND_VARGS.
#define INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD(TestName, ...)                                  \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                                 \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X,                    \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD1,                                           \
            INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD0)(TestName, __VA_ARGS__))
#define INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD(TestName, ClassName, ...)                        \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                                   \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X,                     \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD1,                                            \
            INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD0)(TestName, ClassName, __VA_ARGS__))
// Arity dispatchers that generate the `reg_test` registrar overloads
// (traditional MSVC preprocessor). The candidate lists hold nine signature-based
// registrars followed by two copies of the type-only registrar. The selection
// and the application to the original arguments are wrapped in
// INTERNAL_CATCH_EXPAND_VARGS.
#define INTERNAL_CATCH_NTTP_REG_METHOD_GEN(TestName, ...)                             \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                         \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_NTTP_REGISTER_METHOD,                \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD, \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD, \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD, \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD, INTERNAL_CATCH_NTTP_REGISTER_METHOD, \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD0,                                     \
            INTERNAL_CATCH_NTTP_REGISTER_METHOD0)(TestName, __VA_ARGS__))
#define INTERNAL_CATCH_NTTP_REG_GEN(TestFunc, ...)                                            \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                                 \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER, \
            INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER,                       \
            INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER,                       \
            INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER,                       \
            INTERNAL_CATCH_NTTP_REGISTER, INTERNAL_CATCH_NTTP_REGISTER0,                      \
            INTERNAL_CATCH_NTTP_REGISTER0)(TestFunc, __VA_ARGS__))
// Arity dispatcher for the definition header of a free templated test function
// (traditional MSVC preprocessor). Candidates: nine
// INTERNAL_CATCH_DEFINE_SIG_TEST_X, then INTERNAL_CATCH_DEFINE_SIG_TEST1, then
// INTERNAL_CATCH_DEFINE_SIG_TEST0. The selected helper is applied to
// (TestName, signature...) inside INTERNAL_CATCH_EXPAND_VARGS.
#define INTERNAL_CATCH_DEFINE_SIG_TEST(TestName, ...)                           \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                   \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DEFINE_SIG_TEST_X,             \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST_X, INTERNAL_CATCH_DEFINE_SIG_TEST_X, \
            INTERNAL_CATCH_DEFINE_SIG_TEST1,                                    \
            INTERNAL_CATCH_DEFINE_SIG_TEST0)(TestName, __VA_ARGS__))
// Arity dispatcher for the forward declaration of a free templated test function
// (traditional MSVC preprocessor). Candidates: nine
// INTERNAL_CATCH_DECLARE_SIG_TEST_X, then INTERNAL_CATCH_DECLARE_SIG_TEST1, then
// INTERNAL_CATCH_DECLARE_SIG_TEST0. The selected helper is applied to
// (TestName, signature...) inside INTERNAL_CATCH_EXPAND_VARGS.
// Every multi-element slot must name the DECLARE helper, so that the declaration
// produced here never depends on how the DEFINE helper happens to be written.
#define INTERNAL_CATCH_DECLARE_SIG_TEST(TestName, ...)                            \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                     \
            "dummy", __VA_ARGS__, INTERNAL_CATCH_DECLARE_SIG_TEST_X,              \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST_X, INTERNAL_CATCH_DECLARE_SIG_TEST_X, \
            INTERNAL_CATCH_DECLARE_SIG_TEST1,                                     \
            INTERNAL_CATCH_DECLARE_SIG_TEST0)(TestName, __VA_ARGS__))
// Arity dispatcher (traditional MSVC preprocessor): selects one of
// INTERNAL_CATCH_REMOVE_PARENS_11_ARG ... INTERNAL_CATCH_REMOVE_PARENS_1_ARG via
// INTERNAL_CATCH_VA_NARGS_IMPL and applies it to the same argument list, all
// wrapped in INTERNAL_CATCH_EXPAND_VARGS.
#define INTERNAL_CATCH_REMOVE_PARENS_GEN(...)                                                      \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_VA_NARGS_IMPL(                                      \
            __VA_ARGS__, INTERNAL_CATCH_REMOVE_PARENS_11_ARG, INTERNAL_CATCH_REMOVE_PARENS_10_ARG, \
            INTERNAL_CATCH_REMOVE_PARENS_9_ARG, INTERNAL_CATCH_REMOVE_PARENS_8_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_7_ARG, INTERNAL_CATCH_REMOVE_PARENS_6_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_5_ARG, INTERNAL_CATCH_REMOVE_PARENS_4_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_3_ARG, INTERNAL_CATCH_REMOVE_PARENS_2_ARG,                \
            INTERNAL_CATCH_REMOVE_PARENS_1_ARG)(__VA_ARGS__))
#endif

// end catch_preprocessor.hpp
// start catch_meta.hpp

#include <type_traits>

namespace Catch {

// `always_false<T>::value` is false for every T, but stays dependent on T.
template <typename T>
struct always_false : std::false_type {};

// Turns any well-formed type into std::true_type; used as a SFINAE probe.
template <typename>
struct true_given : std::true_type {};

// Overload pair backing is_callable. The `int` overload is only viable when
// `Fun` can be invoked with `Args...`; otherwise the ellipsis overload is the
// sole candidate and the answer is std::false_type.
struct is_callable_tester {
    template <typename Fun, typename... Args>
    static auto test(int)
            -> true_given<decltype(std::declval<Fun>()(std::declval<Args>()...))>;

    template <typename...>
    static auto test(...) -> std::false_type;
};

// Declared but not defined for arbitrary T: only the function-type form
// `is_callable<Fun(Args...)>` below is usable.
template <typename T>
struct is_callable;

template <typename Fun, typename... Args>
struct is_callable<Fun(Args...)> : decltype(is_callable_tester::test<Fun, Args...>(0)) {};

// FunctionReturnType<Func, U...>: the type produced by calling Func with U...,
// with cv-qualifiers stripped first and the reference stripped afterwards.
#if defined(__cpp_lib_is_invocable) && __cpp_lib_is_invocable >= 201703
// std::result_of is deprecated in C++17 and removed in C++20, so
// std::invoke_result is used whenever the library provides it.
template <typename Func, typename... U>
using FunctionReturnType = typename std::remove_reference<
        typename std::remove_cv<typename std::invoke_result<Func, U...>::type>::type>::type;
#else
// The nested ::type spelling is kept because C++11 is still supported.
template <typename Func, typename... U>
using FunctionReturnType = typename std::remove_reference<
        typename std::remove_cv<typename std::result_of<Func(U...)>::type>::type>::type;
#endif

}  // namespace Catch

// Forward declaration only: `mpl_::na` is never defined in this section.
// NOTE(review): presumably this mirrors Boost.MPL's `na` placeholder so it can be
// named without including Boost - confirm against the places that use it.
namespace mpl_ {
struct na;
}

// end catch_meta.hpp
namespace Catch {

// Adapts a nullary, void-returning member function of C to ITestInvoker.
template <typename C>
class TestInvokerAsMethod : public ITestInvoker {
    using TestMethod = void (C::*)();

    TestMethod m_testAsMethod;

public:
    TestInvokerAsMethod(TestMethod testAsMethod) noexcept : m_testAsMethod(testAsMethod) {}

    // Each invocation runs the test on a freshly default-constructed C, which is
    // destroyed again when the call returns.
    void invoke() const override {
        C fixture;
        (fixture.*m_testAsMethod)();
    }
};

// Free-function overload; only declared in this section.
ITestInvoker *makeTestInvoker(void (*testAsFunction)()) noexcept;

// Member-function overload. Allocates with the non-throwing form of `new`.
template <typename C>
ITestInvoker *makeTestInvoker(void (C::*testAsMethod)()) noexcept {
    return new (std::nothrow) TestInvokerAsMethod<C>(testAsMethod);
}

// Name/tag pair handed to the registrar; both parts default to an empty
// StringRef.
struct NameAndTags {
    NameAndTags(StringRef const &name_ = StringRef(),
                StringRef const &tags_ = StringRef()) noexcept;

    StringRef name;
    StringRef tags;
};

// Non-copyable registration object; the constructor and destructor are only
// declared in this section.
struct AutoReg : NonCopyable {
    AutoReg(ITestInvoker *invoker,
            SourceLineInfo const &lineInfo,
            StringRef const &classOrMethod,
            NameAndTags const &nameAndTags) noexcept;

    ~AutoReg();
};

}  // end namespace Catch

#if defined(CATCH_CONFIG_DISABLE)
// Variants used when CATCH_CONFIG_DISABLE is defined: they emit the code needed
// for the test body to compile, but contain no Catch::AutoReg registration.
//  - TESTCASE: expands to the header of a static void function; the variadic
//    name/tags arguments are dropped.
//  - TESTCASE_METHOD: declares, in an anonymous namespace, a struct deriving from
//    ClassName with a `test()` member, then opens the definition of that member.
#define INTERNAL_CATCH_TESTCASE_NO_REGISTRATION(TestName, ...) static void TestName()
#define INTERNAL_CATCH_TESTCASE_METHOD_NO_REGISTRATION(TestName, ClassName, ...) \
    namespace {                                                                  \
    struct TestName : INTERNAL_CATCH_REMOVE_PARENS(ClassName) {                  \
        void test();                                                             \
    };                                                                           \
    }                                                                            \
    void TestName::test()
// Registration-free back ends for the templated test macros.
//  - ..._NO_REGISTRATION_2: expands only to the definition header of the
//    templated test function `TestFunc`; TestName, Name, Tags and the type list
//    are unused.
//  - ..._METHOD_NO_REGISTRATION_2: declares the templated fixture struct inside
//    an anonymous namespace plus the namespace generated from TestName, then
//    opens the definition of its `test()` member. TestNameClass, Name, Tags and
//    the type list are unused.
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION_2(TestName, TestFunc, Name, Tags, \
                                                            Signature, ...)                 \
    INTERNAL_CATCH_DEFINE_SIG_TEST(TestFunc, INTERNAL_CATCH_REMOVE_PARENS(Signature))
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION_2(                      \
        TestNameClass, TestName, ClassName, Name, Tags, Signature, ...)                  \
    namespace {                                                                          \
    namespace INTERNAL_CATCH_MAKE_NAMESPACE(TestName) {                                  \
        INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD(TestName, ClassName,                      \
                                               INTERNAL_CATCH_REMOVE_PARENS(Signature)); \
    }                                                                                    \
    }                                                                                    \
    INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD(TestName, INTERNAL_CATCH_REMOVE_PARENS(Signature))

// Registration-free front end for type-parameterised tests: generates two unique
// identifiers, fixes the signature to `typename TestType`, and forwards to
// INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION_2.
// The traditional MSVC preprocessor variant differs only in wrapping the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION(Name, Tags, ...)               \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION_2(                                 \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, typename TestType, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION(Name, Tags, ...)               \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION_2(     \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, typename TestType, __VA_ARGS__))
#endif

// Registration-free front end for tests with an explicit template signature:
// generates two unique identifiers and forwards the caller's Signature to
// INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION_2.
// The traditional MSVC preprocessor variant differs only in wrapping the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG_NO_REGISTRATION(Name, Tags, Signature, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION_2(                                  \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),  \
            INTERNAL_CATCH_UNIQUE_NAME(                                                   \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),          \
            Name, Tags, Signature, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG_NO_REGISTRATION(Name, Tags, Signature, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION_2(      \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),  \
            INTERNAL_CATCH_UNIQUE_NAME(                                                   \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),          \
            Name, Tags, Signature, __VA_ARGS__))
#endif

// Registration-free front end for type-parameterised fixture tests: generates
// unique identifiers for the class and the test, fixes the signature to
// `typename T`, and forwards to
// INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION_2.
// The traditional MSVC preprocessor variant differs only in wrapping the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION(ClassName, Name, Tags, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION_2(                              \
            INTERNAL_CATCH_UNIQUE_NAME(                                                      \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),           \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),     \
            ClassName, Name, Tags, typename T, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION(ClassName, Name, Tags, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION_2(  \
            INTERNAL_CATCH_UNIQUE_NAME(                                                      \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),           \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),     \
            ClassName, Name, Tags, typename T, __VA_ARGS__))
#endif

// Registration-free front end for fixture tests with an explicit template
// signature: generates unique identifiers for the class and the test and
// forwards the caller's Signature to
// INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION_2.
// The traditional MSVC preprocessor variant differs only in wrapping the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG_NO_REGISTRATION(ClassName, Name, Tags, \
                                                                     Signature, ...)        \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION_2(                             \
            INTERNAL_CATCH_UNIQUE_NAME(                                                     \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),          \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),    \
            ClassName, Name, Tags, Signature, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG_NO_REGISTRATION(ClassName, Name, Tags, \
                                                                     Signature, ...)        \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION_2( \
            INTERNAL_CATCH_UNIQUE_NAME(                                                     \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),          \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),    \
            ClassName, Name, Tags, Signature, __VA_ARGS__))
#endif
#endif

///////////////////////////////////////////////////////////////////////////////
// Free-function test case.
// INTERNAL_CATCH_TESTCASE2 forward-declares `static void TestName()`, defines a
// uniquely named Catch::AutoReg object in an anonymous namespace that registers
// it (empty class name, NameAndTags built from the variadic arguments), and ends
// with the function header so the braces following the macro become the test
// body. The registrar is bracketed by the warning-suppression macros.
// INTERNAL_CATCH_TESTCASE supplies a unique function name.
#define INTERNAL_CATCH_TESTCASE2(TestName, ...)                                                 \
    static void TestName();                                                                     \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                                   \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                    \
    namespace {                                                                                 \
    Catch::AutoReg INTERNAL_CATCH_UNIQUE_NAME(autoRegistrar)(Catch::makeTestInvoker(&TestName), \
                                                             CATCH_INTERNAL_LINEINFO,           \
                                                             Catch::StringRef(),                \
                                                             Catch::NameAndTags{__VA_ARGS__});  \
    } /* NOLINT */                                                                              \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                                                    \
    static void TestName()
#define INTERNAL_CATCH_TESTCASE(...) \
    INTERNAL_CATCH_TESTCASE2(INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____), __VA_ARGS__)

///////////////////////////////////////////////////////////////////////////////
// Registers an existing member function as a test case. A uniquely named
// Catch::AutoReg object in an anonymous namespace wraps `&QualifiedMethod` in a
// test invoker and passes the string "&" followed by the stringized method name
// as the class-or-method argument. Nothing follows the registrar, so the macro is
// a complete statement on its own.
#define INTERNAL_CATCH_METHOD_AS_TEST_CASE(QualifiedMethod, ...) \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                    \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                     \
    namespace {                                                  \
    Catch::AutoReg INTERNAL_CATCH_UNIQUE_NAME(autoRegistrar)(    \
            Catch::makeTestInvoker(&QualifiedMethod),            \
            CATCH_INTERNAL_LINEINFO,                             \
            "&" #QualifiedMethod,                                \
            Catch::NameAndTags{__VA_ARGS__});                    \
    } /* NOLINT */                                               \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION

///////////////////////////////////////////////////////////////////////////////
// Fixture-based test case.
// INTERNAL_CATCH_TEST_CASE_METHOD2 defines, in an anonymous namespace, a struct
// `TestName` deriving from ClassName (with any wrapping parentheses removed) that
// has a `test()` member, registers `&TestName::test` with the stringized
// ClassName as the class name, and ends with the header of `TestName::test()` so
// the braces following the macro become the test body.
// INTERNAL_CATCH_TEST_CASE_METHOD supplies a unique struct name.
#define INTERNAL_CATCH_TEST_CASE_METHOD2(TestName, ClassName, ...) \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                      \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                       \
    namespace {                                                    \
    struct TestName : INTERNAL_CATCH_REMOVE_PARENS(ClassName) {    \
        void test();                                               \
    };                                                             \
    Catch::AutoReg INTERNAL_CATCH_UNIQUE_NAME(autoRegistrar)(      \
            Catch::makeTestInvoker(&TestName::test),               \
            CATCH_INTERNAL_LINEINFO,                               \
            #ClassName,                                            \
            Catch::NameAndTags{__VA_ARGS__}); /* NOLINT */         \
    }                                                              \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                       \
    void TestName::test()
#define INTERNAL_CATCH_TEST_CASE_METHOD(ClassName, ...)                                        \
    INTERNAL_CATCH_TEST_CASE_METHOD2(INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____), \
                                     ClassName, __VA_ARGS__)

///////////////////////////////////////////////////////////////////////////////
// Registers an already-defined callable as a test case. `Function` is passed to
// Catch::makeTestInvoker as written (no address-of is added) and the class name
// is empty. Unlike the macros above, the Catch::AutoReg object is not wrapped in
// an anonymous namespace, so it is defined in whatever scope the macro is used.
#define INTERNAL_CATCH_REGISTER_TESTCASE(Function, ...)                                    \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                              \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                               \
    Catch::AutoReg INTERNAL_CATCH_UNIQUE_NAME(autoRegistrar)(                              \
            Catch::makeTestInvoker(Function), CATCH_INTERNAL_LINEINFO, Catch::StringRef(), \
            Catch::NameAndTags{__VA_ARGS__}); /* NOLINT */                                 \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION

///////////////////////////////////////////////////////////////////////////////
// Back end of the templated free-function test macros. In order, the expansion:
//  1. forward-declares the templated test function `TestFunc` for `Signature`;
//  2. opens an anonymous namespace plus the namespace generated from TestName and
//     emits the type-list helpers and the `reg_test` overloads into it;
//  3. defines `struct TestName<Types...>`, whose constructor stringizes each
//     entry of __VA_ARGS__ into `tmpl_types` and, through a pack expansion inside
//     a braced `int[]` initializer, calls `reg_test` once per element of Types.
//     Each call uses the test name `Name " - " <stringized type>`, and `index`
//     is advanced after each call;
//  4. defines a static int initialized by an immediately invoked lambda that
//     constructs `TestName<...>` for the supplied types, which runs step 3 during
//     static initialization;
//  5. ends with the definition header of `TestFunc`, so the braces following the
//     macro become the test body.
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_2(TestName, TestFunc, Name, Tags, Signature, ...)       \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                                     \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                      \
    CATCH_INTERNAL_SUPPRESS_ZERO_VARIADIC_WARNINGS                                                \
    CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS                                              \
    INTERNAL_CATCH_DECLARE_SIG_TEST(TestFunc, INTERNAL_CATCH_REMOVE_PARENS(Signature));           \
    namespace {                                                                                   \
    namespace INTERNAL_CATCH_MAKE_NAMESPACE(TestName) {                                           \
        INTERNAL_CATCH_TYPE_GEN                                                                   \
        INTERNAL_CATCH_NTTP_GEN(INTERNAL_CATCH_REMOVE_PARENS(Signature))                          \
        INTERNAL_CATCH_NTTP_REG_GEN(TestFunc, INTERNAL_CATCH_REMOVE_PARENS(Signature))            \
        template <typename... Types>                                                              \
        struct TestName {                                                                         \
            TestName() {                                                                          \
                int index = 0;                                                                    \
                constexpr char const *tmpl_types[] = {                                            \
                        CATCH_REC_LIST(INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS, __VA_ARGS__)};    \
                using expander = int[];                                                           \
                (void)expander{                                                                   \
                        (reg_test(Types{},                                                        \
                                  Catch::NameAndTags{Name " - " + std::string(tmpl_types[index]), \
                                                     Tags}),                                      \
                         index++)...}; /* NOLINT */                                               \
            }                                                                                     \
        };                                                                                        \
        static int INTERNAL_CATCH_UNIQUE_NAME(globalRegistrar) = []() {                           \
            TestName<INTERNAL_CATCH_MAKE_TYPE_LISTS_FROM_TYPES(__VA_ARGS__)>();                   \
            return 0;                                                                             \
        }();                                                                                      \
    }                                                                                             \
    }                                                                                             \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                                                      \
    INTERNAL_CATCH_DEFINE_SIG_TEST(TestFunc, INTERNAL_CATCH_REMOVE_PARENS(Signature))

// Front end for type-parameterised tests: generates unique identifiers for the
// registrar struct and the test function, fixes the signature to
// `typename TestType`, and forwards to INTERNAL_CATCH_TEMPLATE_TEST_CASE_2.
// The traditional MSVC preprocessor variant differs only in wrapping the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE(Name, Tags, ...)                               \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_2(                                                 \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, typename TestType, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE(Name, Tags, ...)                               \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_2(                     \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, typename TestType, __VA_ARGS__))
#endif

// Front end for tests with an explicit template signature: generates unique
// identifiers for the registrar struct and the test function and forwards the
// caller's Signature to INTERNAL_CATCH_TEMPLATE_TEST_CASE_2.
// The traditional MSVC preprocessor variant differs only in wrapping the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG(Name, Tags, Signature, ...)                \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_2(                                                 \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, Signature, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG(Name, Tags, Signature, ...)                \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_2(                     \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, Signature, __VA_ARGS__))
#endif

// INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2
// Generates the boilerplate for a free-function "template product" test case.
//
// Parameters:
//   TestName     - identifier used for the generated registrar struct and for the
//                  namespace built by INTERNAL_CATCH_MAKE_NAMESPACE.
//   TestFuncName - identifier of the function template that holds the test body.
//   Name         - test name; it is pasted directly in front of " - ", so it must
//                  be a string literal.
//   Tags         - tags passed through to Catch::NameAndTags.
//   Signature    - template signature, consumed only by INTERNAL_CATCH_NTTP_GEN.
//   TmplTypes    - (optionally parenthesised) list of templates.
//   TypesList    - (optionally parenthesised) list of template arguments.
//
// Expansion, in order:
//   1. Warning suppression is opened and TestFuncName<TestType>() is
//      forward-declared.
//   2. Inside an anonymous namespace, struct TestName<Types...> is defined. Its
//      reg_tests() expands the Types pack into an int[] initialiser, creating one
//      Catch::AutoReg per type. The i-th test is named
//          Name " - " tmpl_types[i / num_types] "<" types_list[i % num_types] ">"
//      where both arrays hold the stringised TmplTypes / TypesList entries and
//      num_types is the number of entries in types_list.
//   3. A static int, initialised by an immediately invoked lambda, builds the
//      concrete TestName instantiation through create<...> and calls reg_tests().
//   4. Warning suppression is closed and the macro ends with the header
//      `template <typename TestType> static void TestFuncName()`, so the braces
//      written after the macro invocation become the test body.
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2(TestName, TestFuncName, Name, Tags, Signature,  \
                                                   TmplTypes, TypesList)                           \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                                      \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                       \
    CATCH_INTERNAL_SUPPRESS_ZERO_VARIADIC_WARNINGS                                                 \
    CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS                                               \
    template <typename TestType>                                                                   \
    static void TestFuncName();                                                                    \
    namespace {                                                                                    \
    namespace INTERNAL_CATCH_MAKE_NAMESPACE(TestName) {                                            \
        INTERNAL_CATCH_TYPE_GEN                                                                    \
        INTERNAL_CATCH_NTTP_GEN(INTERNAL_CATCH_REMOVE_PARENS(Signature))                           \
        template <typename... Types>                                                               \
        struct TestName {                                                                          \
            void reg_tests() {                                                                     \
                int index = 0;                                                                     \
                using expander = int[];                                                            \
                constexpr char const *tmpl_types[] = {                                             \
                        CATCH_REC_LIST(INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS,                    \
                                       INTERNAL_CATCH_REMOVE_PARENS(TmplTypes))};                  \
                constexpr char const *types_list[] = {                                             \
                        CATCH_REC_LIST(INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS,                    \
                                       INTERNAL_CATCH_REMOVE_PARENS(TypesList))};                  \
                constexpr auto num_types = sizeof(types_list) / sizeof(types_list[0]);             \
                (void)expander{                                                                    \
                        (Catch::AutoReg(                                                           \
                                 Catch::makeTestInvoker(&TestFuncName<Types>),                     \
                                 CATCH_INTERNAL_LINEINFO, Catch::StringRef(),                      \
                                 Catch::NameAndTags{                                               \
                                         Name " - " + std::string(tmpl_types[index / num_types]) + \
                                                 "<" +                                             \
                                                 std::string(types_list[index % num_types]) + ">", \
                                         Tags}),                                                   \
                         index++)...}; /* NOLINT */                                                \
            }                                                                                      \
        };                                                                                         \
        static int INTERNAL_CATCH_UNIQUE_NAME(globalRegistrar) = []() {                            \
            using TestInit = typename create<                                                      \
                    TestName, decltype(get_wrapper<INTERNAL_CATCH_REMOVE_PARENS(TmplTypes)>()),    \
                    TypeList<INTERNAL_CATCH_MAKE_TYPE_LISTS_FROM_TYPES(                            \
                            INTERNAL_CATCH_REMOVE_PARENS(TypesList))>>::type;                      \
            TestInit t;                                                                            \
            t.reg_tests();                                                                         \
            return 0;                                                                              \
        }();                                                                                       \
    }                                                                                              \
    }                                                                                              \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                                                       \
    template <typename TestType>                                                                   \
    static void TestFuncName()

// INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE(Name, Tags, ...)
// Front end for INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2: supplies two
// generated unique identifiers (registrar struct and test function), passes Name
// and Tags through, fixes the signature to `typename T`, and forwards the
// variadic arguments (which fill the TmplTypes and TypesList parameters).
// When CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR is defined the expansion is
// wrapped in INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE(Name, Tags, ...)                       \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2(                                          \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, typename T, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE(Name, Tags, ...)                       \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2(              \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, typename T, __VA_ARGS__))
#endif

// INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(Name, Tags, Signature, ...)
// Like INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE, but the template signature is
// taken from the caller rather than fixed to `typename T`. Forwards to
// INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2 with two generated unique
// identifiers; the traditional-MSVC branch wraps the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(Name, Tags, Signature, ...)        \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2(                                          \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, Signature, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(Name, Tags, Signature, ...)        \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2(              \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, Signature, __VA_ARGS__))
#endif

// INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_2
// Generates the boilerplate for a free-function test case that is instantiated
// once per type contained in a type list.
//
// Parameters:
//   TestName - identifier of the generated registrar struct / namespace.
//   TestFunc - identifier of the function template holding the test body.
//   Name     - test name; pasted in front of " - ", so it must be a string literal.
//   Tags     - tags passed through to Catch::NameAndTags.
//   TmplList - the type list; unpacked via convert<TestName, TmplList>::type.
//
// TestName<Types...>::reg_tests() creates one Catch::AutoReg per type in the
// pack. Because the individual type names are not available as text here, each
// test is named  Name " - " <stringised TmplList> " - " <index>,  where index
// counts up from 0. A static int initialised by an immediately invoked lambda
// runs reg_tests(). The macro ends with the header of TestFunc<TestType>() so
// the braces following the invocation become the test body.
#define INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_2(TestName, TestFunc, Name, Tags, TmplList)         \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                                      \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                       \
    CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS                                               \
    template <typename TestType>                                                                   \
    static void TestFunc();                                                                        \
    namespace {                                                                                    \
    namespace INTERNAL_CATCH_MAKE_NAMESPACE(TestName) {                                            \
        INTERNAL_CATCH_TYPE_GEN                                                                    \
        template <typename... Types>                                                               \
        struct TestName {                                                                          \
            void reg_tests() {                                                                     \
                int index = 0;                                                                     \
                using expander = int[];                                                            \
                (void)expander{                                                                    \
                        (Catch::AutoReg(                                                           \
                                 Catch::makeTestInvoker(&TestFunc<Types>),                         \
                                 CATCH_INTERNAL_LINEINFO, Catch::StringRef(),                      \
                                 Catch::NameAndTags{                                               \
                                         Name " - " +                                              \
                                                 std::string(INTERNAL_CATCH_STRINGIZE(TmplList)) + \
                                                 " - " + std::to_string(index),                    \
                                         Tags}),                                                   \
                         index++)...}; /* NOLINT */                                                \
            }                                                                                      \
        };                                                                                         \
        static int INTERNAL_CATCH_UNIQUE_NAME(globalRegistrar) = []() {                            \
            using TestInit = typename convert<TestName, TmplList>::type;                           \
            TestInit t;                                                                            \
            t.reg_tests();                                                                         \
            return 0;                                                                              \
        }();                                                                                       \
    }                                                                                              \
    }                                                                                              \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                                                       \
    template <typename TestType>                                                                   \
    static void TestFunc()

// INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE(Name, Tags, TmplList)
// Front end for INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_2: generates the two
// unique identifiers (registrar struct and test function) and forwards Name,
// Tags and TmplList unchanged. This macro is not variadic, so it has no
// separate INTERNAL_CATCH_EXPAND_VARGS variant.
#define INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE(Name, Tags, TmplList)                     \
    INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_2(                                            \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            Name, Tags, TmplList)

// INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2
// Generates the boilerplate for a fixture-based (method) templated test case.
//
// Parameters:
//   TestNameClass - identifier of the generated registrar struct.
//   TestName      - identifier handed to the SIG_TEST_METHOD / NTTP_REG_METHOD
//                   helper macros and used to build the enclosing namespace.
//   ClassName     - fixture class; also stringised (#ClassName) for registration.
//   Name          - test name; pasted in front of " - ", so it must be a string
//                   literal.
//   Tags          - tags passed through to Catch::NameAndTags.
//   Signature     - template signature (parentheses are stripped before use).
//   ...           - the types to instantiate the test with.
//
// Unlike the free-function variants, registration happens in the constructor of
// TestNameClass<Types...>: for every type in the pack it calls reg_test(...)
// with a default-constructed Types{} value, the fixture class name and a test
// name of the form  Name " - " <stringised type>.  A static int initialised by
// an immediately invoked lambda constructs a temporary TestNameClass to trigger
// that registration. The macro ends with INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD,
// which is expected to open the definition that the user's braces complete.
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2(TestNameClass, TestName, ClassName, Name, Tags, \
                                                   Signature, ...)                                 \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                                      \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                       \
    CATCH_INTERNAL_SUPPRESS_ZERO_VARIADIC_WARNINGS                                                 \
    CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS                                               \
    namespace {                                                                                    \
    namespace INTERNAL_CATCH_MAKE_NAMESPACE(TestName) {                                            \
        INTERNAL_CATCH_TYPE_GEN                                                                    \
        INTERNAL_CATCH_NTTP_GEN(INTERNAL_CATCH_REMOVE_PARENS(Signature))                           \
        INTERNAL_CATCH_DECLARE_SIG_TEST_METHOD(TestName, ClassName,                                \
                                               INTERNAL_CATCH_REMOVE_PARENS(Signature));           \
        INTERNAL_CATCH_NTTP_REG_METHOD_GEN(TestName, INTERNAL_CATCH_REMOVE_PARENS(Signature))      \
        template <typename... Types>                                                               \
        struct TestNameClass {                                                                     \
            TestNameClass() {                                                                      \
                int index = 0;                                                                     \
                constexpr char const *tmpl_types[] = {                                             \
                        CATCH_REC_LIST(INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS, __VA_ARGS__)};     \
                using expander = int[];                                                            \
                (void)expander{                                                                    \
                        (reg_test(Types{}, #ClassName,                                             \
                                  Catch::NameAndTags{Name " - " + std::string(tmpl_types[index]),  \
                                                     Tags}),                                       \
                         index++)...}; /* NOLINT */                                                \
            }                                                                                      \
        };                                                                                         \
        static int INTERNAL_CATCH_UNIQUE_NAME(globalRegistrar) = []() {                            \
            TestNameClass<INTERNAL_CATCH_MAKE_TYPE_LISTS_FROM_TYPES(__VA_ARGS__)>();               \
            return 0;                                                                              \
        }();                                                                                       \
    }                                                                                              \
    }                                                                                              \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                                                       \
    INTERNAL_CATCH_DEFINE_SIG_TEST_METHOD(TestName, INTERNAL_CATCH_REMOVE_PARENS(Signature))

// INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD(ClassName, Name, Tags, ...)
// Front end for INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2: generates unique
// identifiers for the registrar class (..._C_L_A_S_S____ prefix) and for the
// test itself, fixes the signature to `typename T`, and forwards ClassName,
// Name, Tags and the variadic type list. The traditional-MSVC branch wraps the
// call in INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD(ClassName, Name, Tags, ...)             \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2(                                          \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),       \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            ClassName, Name, Tags, typename T, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD(ClassName, Name, Tags, ...)             \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2(              \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),       \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            ClassName, Name, Tags, typename T, __VA_ARGS__))
#endif

// INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(ClassName, Name, Tags, Signature, ...)
// Like INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD, but with a caller-supplied
// template signature instead of the fixed `typename T`. Forwards to
// INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2 with two generated unique
// identifiers; the traditional-MSVC branch wraps the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(ClassName, Name, Tags, Signature, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2(                                             \
            INTERNAL_CATCH_UNIQUE_NAME(                                                     \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),          \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),    \
            ClassName, Name, Tags, Signature, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(ClassName, Name, Tags, Signature, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_2(                 \
            INTERNAL_CATCH_UNIQUE_NAME(                                                     \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____C_L_A_S_S____),          \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),    \
            ClassName, Name, Tags, Signature, __VA_ARGS__))
#endif

// INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2
// Fixture-based counterpart of INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE2.
//
// Parameters:
//   TestNameClass - identifier of the generated registrar struct; also used to
//                   build the enclosing namespace.
//   TestName      - identifier of the generated struct template that derives from
//                   ClassName<TestType> and declares the member function test().
//   ClassName     - fixture class template; also stringised (#ClassName).
//   Name          - test name; pasted in front of " - ", so it must be a string
//                   literal.
//   Tags          - tags passed through to Catch::NameAndTags.
//   Signature     - template signature, consumed only by INTERNAL_CATCH_NTTP_GEN.
//   TmplTypes     - (optionally parenthesised) list of templates.
//   TypesList     - (optionally parenthesised) list of template arguments.
//
// TestNameClass<Types...>::reg_tests() creates one Catch::AutoReg per type in
// the pack, each invoking &TestName<Types>::test and named
//     Name " - " tmpl_types[i / num_types] "<" types_list[i % num_types] ">".
// A static int initialised by an immediately invoked lambda builds the concrete
// registrar through create<...> and calls reg_tests(). The macro ends with the
// out-of-class header `void TestName<TestType>::test()`, so the braces written
// after the macro invocation become the body of the test method.
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2(                                        \
        TestNameClass, TestName, ClassName, Name, Tags, Signature, TmplTypes, TypesList)           \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                                      \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                       \
    CATCH_INTERNAL_SUPPRESS_ZERO_VARIADIC_WARNINGS                                                 \
    CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS                                               \
    template <typename TestType>                                                                   \
    struct TestName : INTERNAL_CATCH_REMOVE_PARENS(ClassName<TestType>) {                          \
        void test();                                                                               \
    };                                                                                             \
    namespace {                                                                                    \
    namespace INTERNAL_CATCH_MAKE_NAMESPACE(TestNameClass) {                                       \
        INTERNAL_CATCH_TYPE_GEN                                                                    \
        INTERNAL_CATCH_NTTP_GEN(INTERNAL_CATCH_REMOVE_PARENS(Signature))                           \
        template <typename... Types>                                                               \
        struct TestNameClass {                                                                     \
            void reg_tests() {                                                                     \
                int index = 0;                                                                     \
                using expander = int[];                                                            \
                constexpr char const *tmpl_types[] = {                                             \
                        CATCH_REC_LIST(INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS,                    \
                                       INTERNAL_CATCH_REMOVE_PARENS(TmplTypes))};                  \
                constexpr char const *types_list[] = {                                             \
                        CATCH_REC_LIST(INTERNAL_CATCH_STRINGIZE_WITHOUT_PARENS,                    \
                                       INTERNAL_CATCH_REMOVE_PARENS(TypesList))};                  \
                constexpr auto num_types = sizeof(types_list) / sizeof(types_list[0]);             \
                (void)expander{                                                                    \
                        (Catch::AutoReg(                                                           \
                                 Catch::makeTestInvoker(&TestName<Types>::test),                   \
                                 CATCH_INTERNAL_LINEINFO, #ClassName,                              \
                                 Catch::NameAndTags{                                               \
                                         Name " - " + std::string(tmpl_types[index / num_types]) + \
                                                 "<" +                                             \
                                                 std::string(types_list[index % num_types]) + ">", \
                                         Tags}),                                                   \
                         index++)...}; /* NOLINT */                                                \
            }                                                                                      \
        };                                                                                         \
        static int INTERNAL_CATCH_UNIQUE_NAME(globalRegistrar) = []() {                            \
            using TestInit = typename create<                                                      \
                    TestNameClass,                                                                 \
                    decltype(get_wrapper<INTERNAL_CATCH_REMOVE_PARENS(TmplTypes)>()),              \
                    TypeList<INTERNAL_CATCH_MAKE_TYPE_LISTS_FROM_TYPES(                            \
                            INTERNAL_CATCH_REMOVE_PARENS(TypesList))>>::type;                      \
            TestInit t;                                                                            \
            t.reg_tests();                                                                         \
            return 0;                                                                              \
        }();                                                                                       \
    }                                                                                              \
    }                                                                                              \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                                                       \
    template <typename TestType>                                                                   \
    void TestName<TestType>::test()

// INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(ClassName, Name, Tags, ...)
// Front end for INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2: supplies two
// generated unique identifiers, fixes the signature to `typename T`, and
// forwards ClassName, Name, Tags and the variadic arguments (which fill the
// TmplTypes and TypesList parameters). Note that the first generated identifier
// (..._T_E_S_T____ prefix) lands in the TestNameClass parameter and the second
// (..._F_U_N_C____ prefix) in TestName. The traditional-MSVC branch wraps the
// call in INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(ClassName, Name, Tags, ...)     \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2(                                  \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            ClassName, Name, Tags, typename T, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(ClassName, Name, Tags, ...)     \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2(      \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            ClassName, Name, Tags, typename T, __VA_ARGS__))
#endif

// INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(ClassName, Name, Tags,
//                                                      Signature, ...)
// Like INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD, but with a
// caller-supplied template signature instead of the fixed `typename T`.
// Forwards to INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2 with two
// generated unique identifiers; the traditional-MSVC branch wraps the call in
// INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(ClassName, Name, Tags, Signature, \
                                                             ...)                              \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2(                                        \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),       \
            INTERNAL_CATCH_UNIQUE_NAME(                                                        \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),               \
            ClassName, Name, Tags, Signature, __VA_ARGS__)
#else
#define INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(ClassName, Name, Tags, Signature, \
                                                             ...)                              \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_2(            \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____),       \
            INTERNAL_CATCH_UNIQUE_NAME(                                                        \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),               \
            ClassName, Name, Tags, Signature, __VA_ARGS__))
#endif

// INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD_2
// Fixture-based counterpart of INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_2.
//
// Parameters:
//   TestNameClass - identifier of the generated registrar struct.
//   TestName      - identifier of the generated struct template that derives from
//                   ClassName<TestType> and declares test(); also used to build
//                   the enclosing namespace.
//   ClassName     - fixture class template; also stringised (#ClassName).
//   Name          - test name; pasted in front of " - ", so it must be a string
//                   literal.
//   Tags          - tags passed through to Catch::NameAndTags.
//   TmplList      - the type list; unpacked via convert<TestNameClass, TmplList>.
//
// TestNameClass<Types...>::reg_tests() creates one Catch::AutoReg per type in
// the pack, each invoking &TestName<Types>::test and named
//     Name " - " <stringised TmplList> " - " <index>   (index starts at 0).
// A static int initialised by an immediately invoked lambda runs reg_tests().
// The macro ends with the out-of-class header `void TestName<TestType>::test()`,
// so the braces written after the invocation become the test method body.
#define INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD_2(TestNameClass, TestName, ClassName, Name,  \
                                                        Tags, TmplList)                            \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                                      \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                       \
    CATCH_INTERNAL_SUPPRESS_UNUSED_TEMPLATE_WARNINGS                                               \
    template <typename TestType>                                                                   \
    struct TestName : INTERNAL_CATCH_REMOVE_PARENS(ClassName<TestType>) {                          \
        void test();                                                                               \
    };                                                                                             \
    namespace {                                                                                    \
    namespace INTERNAL_CATCH_MAKE_NAMESPACE(TestName) {                                            \
        INTERNAL_CATCH_TYPE_GEN                                                                    \
        template <typename... Types>                                                               \
        struct TestNameClass {                                                                     \
            void reg_tests() {                                                                     \
                int index = 0;                                                                     \
                using expander = int[];                                                            \
                (void)expander{                                                                    \
                        (Catch::AutoReg(                                                           \
                                 Catch::makeTestInvoker(&TestName<Types>::test),                   \
                                 CATCH_INTERNAL_LINEINFO, #ClassName,                              \
                                 Catch::NameAndTags{                                               \
                                         Name " - " +                                              \
                                                 std::string(INTERNAL_CATCH_STRINGIZE(TmplList)) + \
                                                 " - " + std::to_string(index),                    \
                                         Tags}),                                                   \
                         index++)...}; /* NOLINT */                                                \
            }                                                                                      \
        };                                                                                         \
        static int INTERNAL_CATCH_UNIQUE_NAME(globalRegistrar) = []() {                            \
            using TestInit = typename convert<TestNameClass, TmplList>::type;                      \
            TestInit t;                                                                            \
            t.reg_tests();                                                                         \
            return 0;                                                                              \
        }();                                                                                       \
    }                                                                                              \
    }                                                                                              \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                                                       \
    template <typename TestType>                                                                   \
    void TestName<TestType>::test()

// INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(ClassName, Name, Tags, TmplList)
// Front end for INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD_2: generates the
// two unique identifiers (passed as TestNameClass and TestName respectively) and
// forwards ClassName, Name, Tags and TmplList unchanged. This macro is not
// variadic, so it has no separate INTERNAL_CATCH_EXPAND_VARGS variant.
#define INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(ClassName, Name, Tags, TmplList)   \
    INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD_2(                                     \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____), \
            INTERNAL_CATCH_UNIQUE_NAME(                                                  \
                    ____C_A_T_C_H____T_E_M_P_L_A_T_E____T_E_S_T____F_U_N_C____),         \
            ClassName, Name, Tags, TmplList)

// end catch_test_registry.h
// start catch_capture.hpp

// start catch_assertionhandler.h

// start catch_assertioninfo.h

// start catch_result_type.h

namespace Catch {

// ResultWas::OfType enum
// Result category codes, wrapped in a struct so the enumerators are scoped as
// ResultWas::X. Every named failure value below has FailureBit (0x10) set; the
// exception-related values additionally share the 0x100 bit through Exception.
struct ResultWas {
    enum OfType {
        Unknown = -1,
        Ok = 0,
        Info = 1,
        Warning = 2,

        // Marker bit OR-ed into every failure value that follows.
        FailureBit = 0x10,

        ExpressionFailed = FailureBit | 1,
        ExplicitFailure = FailureBit | 2,

        // Base value for the exception-related failures (0x100 plus FailureBit).
        Exception = 0x100 | FailureBit,

        ThrewException = Exception | 1,
        DidntThrowException = Exception | 2,

        // Uses its own 0x200 bit and is also flagged as a failure.
        FatalErrorCondition = 0x200 | FailureBit

    };
};

bool isOk(ResultWas::OfType resultType);
bool isJustInfo(int flags);

// ResultDisposition::Flags enum
// Bit flags, wrapped in a struct so the enumerators are scoped as
// ResultDisposition::X. Each enumerator occupies its own bit (0x01, 0x02, 0x04,
// 0x08), so several can be combined in one value and tested with a bit mask.
struct ResultDisposition {
    enum Flags {
        Normal = 0x01,

        ContinueOnFailure = 0x02,  // Failures fail test, but execution continues
        FalseTest = 0x04,          // Prefix expression with !
        SuppressFail = 0x08        // Failures are reported but do not fail the test
    };
};

ResultDisposition::Flags operator|(ResultDisposition::Flags lhs, ResultDisposition::Flags rhs);

bool shouldContinueOnFailure(int flags);
// Reports whether the ResultDisposition::FalseTest bit is set in `flags`.
inline bool isFalseTest(int flags) {
    const int falseTestBit = flags & ResultDisposition::FalseTest;
    return falseTestBit != 0;
}
bool shouldSuppressFailure(int flags);

}  // end namespace Catch

// end catch_result_type.h
namespace Catch {

// Aggregate bundling four pieces of information: a macro name, a source
// location, the captured expression text and a set of ResultDisposition flags.
// It deliberately declares no constructors so that it stays an aggregate (see
// the note below); the member order is therefore part of its interface for
// brace initialisation.
struct AssertionInfo {
    StringRef macroName;
    SourceLineInfo lineInfo;
    StringRef capturedExpression;
    ResultDisposition::Flags resultDisposition;

    // We want to delete this constructor but a compiler bug in 4.8 means
    // the struct is then treated as non-aggregate
    // AssertionInfo() = delete;
};

}  // end namespace Catch

// end catch_assertioninfo.h
// start catch_decomposer.h

// start catch_tostring.h

#include <cstddef>
#include <string>
#include <type_traits>
#include <vector>
// start catch_stream.h

#include <cstddef>
#include <iosfwd>
#include <ostream>

namespace Catch {

std::ostream &cout();
std::ostream &cerr();
std::ostream &clog();

class StringRef;

// Abstract interface for an object that exposes a std::ostream.
// The virtual destructor is declared here and defined out of line.
struct IStream {
    virtual ~IStream();
    // Returns the underlying output stream. Callable on a const IStream, yet it
    // hands back a non-const std::ostream reference.
    virtual std::ostream &stream() const = 0;
};

auto makeStream(StringRef const &filename) -> IStream const *;

// Non-copyable wrapper around a std::ostream obtained elsewhere (the
// constructor and destructor are defined out of line). Values are written with
// operator<< and the accumulated text is retrieved with str().
class ReusableStringStream : NonCopyable {
    std::size_t m_index;
    std::ostream *m_oss;

public:
    ReusableStringStream();
    ~ReusableStringStream();

    // Returns the text written so far (defined out of line).
    std::string str() const;

    // Direct access to the wrapped stream.
    std::ostream &get() { return *m_oss; }

    // Streams `value` into the wrapped stream; returns *this for chaining.
    template <typename T>
    ReusableStringStream &operator<<(T const &value) {
        get() << value;
        return *this;
    }
};
}  // namespace Catch

// end catch_stream.h
// start catch_interfaces_enum_values_registry.h

#include <vector>

namespace Catch {

namespace Detail {
// Registry record for one enum: its name plus (integer value, name) pairs.
struct EnumInfo {
    StringRef m_name;
    std::vector<std::pair<int, StringRef>> m_values;

    ~EnumInfo();

    // Maps an integer enum value to a name; defined elsewhere.
    // NOTE(review): behaviour for values missing from m_values is not visible here.
    StringRef lookup(int value) const;
};
}  // namespace Detail

// Interface used to register enums so that their values can be printed by name.
struct IMutableEnumValuesRegistry {
    virtual ~IMutableEnumValuesRegistry();

    // Registers an enum from its name, the stringified enumerator list and the
    // enumerator values converted to int.
    virtual Detail::EnumInfo const &registerEnum(StringRef enumName,
                                                 StringRef allEnums,
                                                 std::vector<int> const &values) = 0;

    // Typed convenience overload: converts every enumerator to int and forwards
    // to the virtual overload above. Enums wider than int are rejected at
    // compile time.
    template <typename E>
    Detail::EnumInfo const &registerEnum(StringRef enumName,
                                         StringRef allEnums,
                                         std::initializer_list<E> values) {
        static_assert(sizeof(int) >= sizeof(E), "Cannot serialize enum to int");
        std::vector<int> asInts;
        asInts.reserve(values.size());
        for (auto it = values.begin(); it != values.end(); ++it) {
            asInts.push_back(static_cast<int>(*it));
        }
        return registerEnum(enumName, allEnums, asInts);
    }
};

}  // namespace Catch

// end catch_interfaces_enum_values_registry.h

#ifdef CATCH_CONFIG_CPP17_STRING_VIEW
#include <string_view>
#endif

#ifdef __OBJC__
// start catch_objc_arc.hpp
// Objective-C helpers that compile both with and without ARC.

#import <Foundation/Foundation.h>

// CATCH_ARC_ENABLED is 1 when the compiler reports ARC, 0 otherwise
// (including compilers without __has_feature).
#ifdef __has_feature
#define CATCH_ARC_ENABLED __has_feature(objc_arc)
#else
#define CATCH_ARC_ENABLED 0
#endif

void arcSafeRelease(NSObject *obj);
id performOptionalSelector(id obj, SEL sel);

#if !CATCH_ARC_ENABLED
// Manual reference counting: release explicitly.
inline void arcSafeRelease(NSObject *obj) { [obj release]; }
// Invokes `sel` on `obj` if it responds to it; returns nil otherwise.
inline id performOptionalSelector(id obj, SEL sel) {
    if ([obj respondsToSelector:sel])
        return [obj performSelector:sel];
    return nil;
}
// Ownership qualifiers expand to nothing without ARC.
#define CATCH_UNSAFE_UNRETAINED
#define CATCH_ARC_STRONG
#else
// Under ARC releasing is a no-op here.
inline void arcSafeRelease(NSObject *) {}
// Same contract as the non-ARC version; the clang warning about potential
// leaks from performSelector is silenced around the call.
inline id performOptionalSelector(id obj, SEL sel) {
#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Warc-performSelector-leaks"
#endif
    if ([obj respondsToSelector:sel])
        return [obj performSelector:sel];
#ifdef __clang__
#pragma clang diagnostic pop
#endif
    return nil;
}
#define CATCH_UNSAFE_UNRETAINED __unsafe_unretained
#define CATCH_ARC_STRONG __strong
#endif

// end catch_objc_arc.hpp
#endif

#ifdef _MSC_VER
#pragma warning(push)
#pragma warning(disable : 4180)  // We attempt to stream a function (address) by const&, \
                                 // which MSVC complains about but is harmless
#endif

namespace Catch {
namespace Detail {

// Text returned for values that cannot be stringified; defined elsewhere.
extern const std::string unprintableString;

// Renders `size` bytes starting at `object` as a string; defined elsewhere.
std::string rawMemoryToString(const void *object, std::size_t size);

// Convenience overload: forwards the address and the byte size of `object`
// to the raw-bytes overload above.
template <typename T>
std::string rawMemoryToString(const T &object) {
    const void *const address = &object;
    return rawMemoryToString(address, sizeof(T));
}

// Compile-time trait: `value` is true when `std::ostream << const T&` is a
// well-formed expression.
template <typename T>
class IsStreamInsertable {
    // Preferred overload: only viable when `Out& << Value` compiles.
    template <typename Out, typename Value>
    static auto probe(int)
            -> decltype(std::declval<Out &>() << std::declval<Value>(), std::true_type());

    // Fallback picked when the expression above is ill-formed.
    template <typename, typename>
    static auto probe(...) -> std::false_type;

    using Verdict = decltype(probe<std::ostream, const T &>(0));

public:
    static const bool value = Verdict::value;
};

// Declared here, defined after stringify() further down; needed by the enum
// overload of convertUnstreamable below.
template <typename E>
std::string convertUnknownEnumToString(E e);

// Fallback conversions for types that cannot be streamed. The three overloads
// are made mutually exclusive through enable_if:
//   1. neither an enum nor derived from std::exception -> unprintableString
//   2. derived from std::exception (and not an enum)   -> ex.what()
//   3. enum                                             -> convertUnknownEnumToString
template <typename T>
typename std::enable_if<!std::is_enum<T>::value && !std::is_base_of<std::exception, T>::value,
                        std::string>::type
convertUnstreamable(T const &) {
    return Detail::unprintableString;
}
template <typename T>
typename std::enable_if<!std::is_enum<T>::value && std::is_base_of<std::exception, T>::value,
                        std::string>::type
convertUnstreamable(T const &ex) {
    return ex.what();
}

template <typename T>
typename std::enable_if<std::is_enum<T>::value, std::string>::type convertUnstreamable(
        T const &value) {
    return convertUnknownEnumToString(value);
}

#if defined(_MANAGED)
//! Convert a CLR reference to a utf8 std::string
//!
//! Returns "null" for a null handle. Otherwise the object's ToString() result
//! is encoded as UTF-8 and copied into a std::string.
template <typename T>
std::string clrReferenceToString(T ^ ref) {
    if (ref == nullptr)
        return std::string("null");
    auto bytes = System::Text::Encoding::UTF8->GetBytes(ref->ToString());
    // An empty ToString() result yields a zero-length array; indexing element 0
    // of it would be out of range, so return early instead of pinning.
    if (bytes->Length == 0)
        return std::string();
    // Pin the managed array so its storage cannot move while it is copied.
    cli::pin_ptr<System::Byte> p = &bytes[0];
    return std::string(reinterpret_cast<char const *>(p), bytes->Length);
}
#endif

}  // namespace Detail

// Primary stringification template. Exactly one of the two `convert` overloads
// is enabled, depending on whether the type can be streamed to std::ostream.
// If we decide for C++14, change these to enable_if_ts
template <typename T, typename = void>
struct StringMaker {
    // Streamable types: write the value into a ReusableStringStream.
    template <typename Fake = T>
    static typename std::enable_if<::Catch::Detail::IsStreamInsertable<Fake>::value,
                                   std::string>::type
    convert(const Fake &value) {
        ReusableStringStream buffer;
        // NB: call using the function-like syntax to avoid ambiguity with
        // user-defined templated operator<< under clang.
        return buffer.operator<<(value).str();
    }

    // Non-streamable types: use the user-supplied fallback stringifier when one
    // is configured, otherwise the built-in convertUnstreamable.
    template <typename Fake = T>
    static typename std::enable_if<!::Catch::Detail::IsStreamInsertable<Fake>::value,
                                   std::string>::type
    convert(const Fake &value) {
#if defined(CATCH_CONFIG_FALLBACK_STRINGIFIER)
        return CATCH_CONFIG_FALLBACK_STRINGIFIER(value);
#else
        return Detail::convertUnstreamable(value);
#endif
    }
};

namespace Detail {

// This function dispatches all stringification requests inside of Catch.
// Should be preferably called fully qualified, like ::Catch::Detail::stringify
template <typename T>
std::string stringify(const T &e) {
    return ::Catch::StringMaker<
            typename std::remove_cv<typename std::remove_reference<T>::type>::type>::convert(e);
}

template <typename E>
std::string convertUnknownEnumToString(E e) {
    return ::Catch::Detail::stringify(static_cast<typename std::underlying_type<E>::type>(e));
}

#if defined(_MANAGED)
template <typename T>
std::string stringify(T ^ e) {
    return ::Catch::StringMaker<T ^>::convert(e);
}
#endif

}  // namespace Detail

// Some predefined specializations
// The string-like specializations below only declare `convert`; the
// definitions live elsewhere.

template <>
struct StringMaker<std::string> {
    static std::string convert(const std::string &str);
};

// Only available when C++17 string_view support is configured.
#ifdef CATCH_CONFIG_CPP17_STRING_VIEW
template <>
struct StringMaker<std::string_view> {
    static std::string convert(std::string_view str);
};
#endif

template <>
struct StringMaker<char const *> {
    static std::string convert(char const *str);
};
template <>
struct StringMaker<char *> {
    static std::string convert(char *str);
};

// Wide-character counterparts, compiled only when CATCH_CONFIG_WCHAR is defined.
#ifdef CATCH_CONFIG_WCHAR
template <>
struct StringMaker<std::wstring> {
    static std::string convert(const std::wstring &wstr);
};

#ifdef CATCH_CONFIG_CPP17_STRING_VIEW
template <>
struct StringMaker<std::wstring_view> {
    static std::string convert(std::wstring_view str);
};
#endif

template <>
struct StringMaker<wchar_t const *> {
    static std::string convert(wchar_t const *str);
};
template <>
struct StringMaker<wchar_t *> {
    static std::string convert(wchar_t *str);
};
#endif

// Character arrays are treated as NUL-terminated C strings: the array is
// copied into a std::string, which is then stringified.
// TBD: Should we use `strnlen` to ensure that we don't go out of the buffer,
//      while keeping string semantics?
template <int SZ>
struct StringMaker<char[SZ]> {
    static std::string convert(char const *str) {
        std::string const text{str};
        return ::Catch::Detail::stringify(text);
    }
};
template <int SZ>
struct StringMaker<signed char[SZ]> {
    static std::string convert(signed char const *str) {
        // Reinterpret as plain char so the std::string constructor accepts it.
        std::string const text{reinterpret_cast<char const *>(str)};
        return ::Catch::Detail::stringify(text);
    }
};
template <int SZ>
struct StringMaker<unsigned char[SZ]> {
    static std::string convert(unsigned char const *str) {
        // Reinterpret as plain char so the std::string constructor accepts it.
        std::string const text{reinterpret_cast<char const *>(str)};
        return ::Catch::Detail::stringify(text);
    }
};

// Declarations of the StringMaker specializations for built-in types.
// All `convert` functions below are defined elsewhere.
#if defined(CATCH_CONFIG_CPP17_BYTE)
template <>
struct StringMaker<std::byte> {
    static std::string convert(std::byte value);
};
#endif  // defined(CATCH_CONFIG_CPP17_BYTE)
template <>
struct StringMaker<int> {
    static std::string convert(int value);
};
template <>
struct StringMaker<long> {
    static std::string convert(long value);
};
template <>
struct StringMaker<long long> {
    static std::string convert(long long value);
};
template <>
struct StringMaker<unsigned int> {
    static std::string convert(unsigned int value);
};
template <>
struct StringMaker<unsigned long> {
    static std::string convert(unsigned long value);
};
template <>
struct StringMaker<unsigned long long> {
    static std::string convert(unsigned long long value);
};

template <>
struct StringMaker<bool> {
    static std::string convert(bool b);
};

template <>
struct StringMaker<char> {
    static std::string convert(char c);
};
template <>
struct StringMaker<signed char> {
    static std::string convert(signed char c);
};
template <>
struct StringMaker<unsigned char> {
    static std::string convert(unsigned char c);
};

template <>
struct StringMaker<std::nullptr_t> {
    static std::string convert(std::nullptr_t);
};

// The floating-point specializations additionally expose a mutable
// `precision` setting.
// NOTE(review): presumably the number of digits used by convert - confirm in the definition.
template <>
struct StringMaker<float> {
    static std::string convert(float value);
    static int precision;
};

template <>
struct StringMaker<double> {
    static std::string convert(double value);
    static int precision;
};

// Object pointers: null prints as "nullptr", anything else as the raw bytes of
// the pointer value itself.
template <typename T>
struct StringMaker<T *> {
    template <typename U>
    static std::string convert(U *p) {
        if (!p) {
            return "nullptr";
        }
        return ::Catch::Detail::rawMemoryToString(p);
    }
};

// Pointers to members follow the same rule as object pointers.
template <typename R, typename C>
struct StringMaker<R C::*> {
    static std::string convert(R C::*p) {
        if (!p) {
            return "nullptr";
        }
        return ::Catch::Detail::rawMemoryToString(p);
    }
};

#if defined(_MANAGED)
// C++/CLI handles are stringified through clrReferenceToString.
template <typename T>
struct StringMaker<T ^> {
    static std::string convert(T ^ ref) { return ::Catch::Detail::clrReferenceToString(ref); }
};
#endif

namespace Detail {
// Formats the elements in [first, last) as "{ a, b, c }".
// An empty range produces "{  }" (opening and closing parts with nothing between).
template <typename InputIterator, typename Sentinel = InputIterator>
std::string rangeToString(InputIterator first, Sentinel last) {
    ReusableStringStream rss;
    rss << "{ ";
    bool needsSeparator = false;
    for (; first != last; ++first) {
        if (needsSeparator) {
            rss << ", ";
        }
        rss << ::Catch::Detail::stringify(*first);
        needsSeparator = true;
    }
    rss << " }";
    return rss.str();
}
}  // namespace Detail

#ifdef __OBJC__
// NSString: nil prints as "nil", otherwise '@' followed by the UTF-8 contents.
template <>
struct StringMaker<NSString *> {
    static std::string convert(NSString *nsstring) {
        if (!nsstring)
            return "nil";
        return std::string("@") + [nsstring UTF8String];
    }
};
// Any other NSObject is printed through its -description string.
template <>
struct StringMaker<NSObject *> {
    static std::string convert(NSObject *nsObject) {
        return ::Catch::Detail::stringify([nsObject description]);
    }
};
namespace Detail {
// Non-template overload so NSString* arguments go to the NSString StringMaker.
inline std::string stringify(NSString *nsstring) {
    return StringMaker<NSString *>::convert(nsstring);
}

}  // namespace Detail
#endif  // __OBJC__

}  // namespace Catch

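//////////////////////////////////////////////////////
// Separate std-lib types stringification, so it can be selectively enabled.
// This means that we do not bring in the corresponding standard library
// headers unless the matching CATCH_CONFIG_ENABLE_*_STRINGMAKER macro is defined.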

// CATCH_CONFIG_ENABLE_ALL_STRINGMAKERS is shorthand for defining every
// individual *_STRINGMAKER switch checked below.
#if defined(CATCH_CONFIG_ENABLE_ALL_STRINGMAKERS)
#define CATCH_CONFIG_ENABLE_PAIR_STRINGMAKER
#define CATCH_CONFIG_ENABLE_TUPLE_STRINGMAKER
#define CATCH_CONFIG_ENABLE_VARIANT_STRINGMAKER
#define CATCH_CONFIG_ENABLE_CHRONO_STRINGMAKER
#define CATCH_CONFIG_ENABLE_OPTIONAL_STRINGMAKER
#endif

// Separate std::pair specialization
#if defined(CATCH_CONFIG_ENABLE_PAIR_STRINGMAKER)
#include <utility>
namespace Catch {
// std::pair is printed as "{ first, second }".
template <typename T1, typename T2>
struct StringMaker<std::pair<T1, T2>> {
    static std::string convert(const std::pair<T1, T2> &pair) {
        ReusableStringStream rss;
        rss << "{ ";
        rss << ::Catch::Detail::stringify(pair.first);
        rss << ", ";
        rss << ::Catch::Detail::stringify(pair.second);
        rss << " }";
        return rss.str();
    }
};
}  // namespace Catch
#endif  // CATCH_CONFIG_ENABLE_PAIR_STRINGMAKER

#if defined(CATCH_CONFIG_ENABLE_OPTIONAL_STRINGMAKER) && defined(CATCH_CONFIG_CPP17_OPTIONAL)
#include <optional>
namespace Catch {
// std::optional: an empty optional prints as "{ }", an engaged one prints as
// its contained value.
template <typename T>
struct StringMaker<std::optional<T>> {
    static std::string convert(const std::optional<T> &optional) {
        ReusableStringStream rss;
        if (!optional.has_value()) {
            rss << "{ }";
        } else {
            rss << ::Catch::Detail::stringify(*optional);
        }
        return rss.str();
    }
};
}  // namespace Catch
#endif  // CATCH_CONFIG_ENABLE_OPTIONAL_STRINGMAKER

// Separate std::tuple specialization
#if defined(CATCH_CONFIG_ENABLE_TUPLE_STRINGMAKER)
#include <tuple>
namespace Catch {
namespace Detail {
// Recursively prints tuple element N and everything after it. The defaulted
// bool parameter is false once N reaches the tuple size, which selects the
// terminating specialization below.
template <typename Tuple, std::size_t N = 0, bool = (N < std::tuple_size<Tuple>::value)>
struct TupleElementPrinter {
    static void print(const Tuple &tuple, std::ostream &os) {
        // The first element is preceded by a single space, later ones by ", ".
        const char *const lead = (N == 0) ? " " : ", ";
        os << lead;
        os << ::Catch::Detail::stringify(std::get<N>(tuple));
        TupleElementPrinter<Tuple, N + 1>::print(tuple, os);
    }
};

// End of recursion: nothing left to print.
template <typename Tuple, std::size_t N>
struct TupleElementPrinter<Tuple, N, false> {
    static void print(const Tuple &, std::ostream &) {}
};

}  // namespace Detail

// std::tuple is printed as "{ a, b, c }"; an empty tuple yields "{ }".
template <typename... Types>
struct StringMaker<std::tuple<Types...>> {
    static std::string convert(const std::tuple<Types...> &tuple) {
        ReusableStringStream rss;
        rss << '{';
        std::ostream &os = rss.get();
        Detail::TupleElementPrinter<std::tuple<Types...>>::print(tuple, os);
        rss << " }";
        return rss.str();
    }
};
}  // namespace Catch
#endif  // CATCH_CONFIG_ENABLE_TUPLE_STRINGMAKER

#if defined(CATCH_CONFIG_ENABLE_VARIANT_STRINGMAKER) && defined(CATCH_CONFIG_CPP17_VARIANT)
#include <variant>
namespace Catch {
// std::monostate prints like an empty optional.
template <>
struct StringMaker<std::monostate> {
    static std::string convert(const std::monostate &) { return "{ }"; }
};

// std::variant prints the currently held alternative, or a fixed marker when
// the variant is valueless by exception.
template <typename... Elements>
struct StringMaker<std::variant<Elements...>> {
    static std::string convert(const std::variant<Elements...> &variant) {
        if (!variant.valueless_by_exception()) {
            return std::visit([](const auto &value) { return ::Catch::Detail::stringify(value); },
                              variant);
        }
        return "{valueless variant}";
    }
};
}  // namespace Catch
#endif  // CATCH_CONFIG_ENABLE_VARIANT_STRINGMAKER

namespace Catch {
// Import begin/ end from std here
using std::begin;
using std::end;

namespace detail {
// Maps any list of types to `void`; used to drive SFINAE in the partial
// specialization below.
template <typename...>
struct void_type {
    typedef void type;
};

// Primary template: by default a type is not treated as a range.
template <typename T, typename = void>
struct is_range_impl : std::false_type {};

// Chosen when an unqualified `begin(T)` call is well-formed.
template <typename T>
struct is_range_impl<T, typename void_type<decltype(begin(std::declval<T>()))>::type>
        : std::true_type {};
}  // namespace detail

// Public trait: true when an unqualified begin() call works for T
// (see detail::is_range_impl).
template <typename T>
struct is_range : detail::is_range_impl<T> {};

#if defined(_MANAGED)  // Managed types are never ranges
template <typename T>
struct is_range<T ^> {
    static const bool value = false;
};
#endif

// Stringifies a whole range by handing its begin/end pair to the
// iterator-based Detail::rangeToString.
template <typename Range>
auto rangeToString(Range const &range) -> std::string {
    return ::Catch::Detail::rangeToString(begin(range), end(range));
}

// Handle vector<bool> specially: every element is converted to a plain bool
// before it is stringified. The output format matches the generic overload.
template <typename Allocator>
auto rangeToString(std::vector<bool, Allocator> const &v) -> std::string {
    ReusableStringStream rss;
    rss << "{ ";
    for (auto it = v.begin(); it != v.end(); ++it) {
        if (it != v.begin()) {
            rss << ", ";
        }
        rss << ::Catch::Detail::stringify(static_cast<bool>(*it));
    }
    rss << " }";
    return rss.str();
}

// Ranges that are NOT stream-insertable are printed element by element.
// Ranges that can be streamed keep using the primary StringMaker instead.
template <typename R>
struct StringMaker<R,
                   typename std::enable_if<is_range<R>::value &&
                                           !::Catch::Detail::IsStreamInsertable<R>::value>::type> {
    static std::string convert(R const &range) { return rangeToString(range); }
};

// Built-in arrays are printed as ranges.
template <typename T, int SZ>
struct StringMaker<T[SZ]> {
    static std::string convert(T const (&arr)[SZ]) { return rangeToString(arr); }
};

}  // namespace Catch

// Separate std::chrono::duration specialization
#if defined(CATCH_CONFIG_ENABLE_CHRONO_STRINGMAKER)
#include <chrono>
#include <ctime>
#include <ratio>

namespace Catch {

// Produces the unit prefix that is printed in front of 's' for a duration
// with the given std::ratio period.
template <class Ratio>
struct ratio_string {
    static std::string symbol();
};

// Generic periods are rendered as "[num/den]".
template <class Ratio>
std::string ratio_string<Ratio>::symbol() {
    Catch::ReusableStringStream rss;
    rss << '[';
    rss << Ratio::num;
    rss << '/';
    rss << Ratio::den;
    rss << ']';
    return rss.str();
}

// The SI sub-second ratios have dedicated symbols, defined elsewhere.
template <>
struct ratio_string<std::atto> {
    static std::string symbol();
};
template <>
struct ratio_string<std::femto> {
    static std::string symbol();
};
template <>
struct ratio_string<std::pico> {
    static std::string symbol();
};
template <>
struct ratio_string<std::nano> {
    static std::string symbol();
};
template <>
struct ratio_string<std::micro> {
    static std::string symbol();
};
template <>
struct ratio_string<std::milli> {
    static std::string symbol();
};

////////////
// std::chrono::duration specializations
// General case: "<count> <ratio symbol>s".
template <typename Value, typename Ratio>
struct StringMaker<std::chrono::duration<Value, Ratio>> {
    static std::string convert(std::chrono::duration<Value, Ratio> const &duration) {
        ReusableStringStream rss;
        rss << duration.count();
        rss << ' ';
        rss << ratio_string<Ratio>::symbol();
        rss << 's';
        return rss.str();
    }
};
// Whole seconds: "<count> s".
template <typename Value>
struct StringMaker<std::chrono::duration<Value, std::ratio<1>>> {
    static std::string convert(std::chrono::duration<Value, std::ratio<1>> const &duration) {
        ReusableStringStream rss;
        rss << duration.count();
        rss << " s";
        return rss.str();
    }
};
// Minutes: "<count> m".
template <typename Value>
struct StringMaker<std::chrono::duration<Value, std::ratio<60>>> {
    static std::string convert(std::chrono::duration<Value, std::ratio<60>> const &duration) {
        ReusableStringStream rss;
        rss << duration.count();
        rss << " m";
        return rss.str();
    }
};
// Hours: "<count> h".
template <typename Value>
struct StringMaker<std::chrono::duration<Value, std::ratio<3600>>> {
    static std::string convert(std::chrono::duration<Value, std::ratio<3600>> const &duration) {
        ReusableStringStream rss;
        rss << duration.count();
        rss << " h";
        return rss.str();
    }
};

////////////
// std::chrono::time_point specializations
// A time point of an arbitrary clock is printed as the stringified duration
// since that clock's epoch followed by " since epoch". Only system_clock time
// points get a calendar representation (see the next specialization).
template <typename Clock, typename Duration>
struct StringMaker<std::chrono::time_point<Clock, Duration>> {
    static std::string convert(std::chrono::time_point<Clock, Duration> const &time_point) {
        std::string text = ::Catch::Detail::stringify(time_point.time_since_epoch());
        text += " since epoch";
        return text;
    }
};
// std::chrono::time_point<system_clock> specialization
// Prints the time point as a UTC timestamp of the form "2017-01-16T17:06:45Z".
// If the value cannot be converted to calendar time, or the formatted text does
// not fit the fixed-size buffer, a descriptive placeholder is returned instead.
template <typename Duration>
struct StringMaker<std::chrono::time_point<std::chrono::system_clock, Duration>> {
    static std::string convert(
            std::chrono::time_point<std::chrono::system_clock, Duration> const &time_point) {
        // to_time_t only accepts system_clock::time_point. Cast explicitly so
        // that time points with a finer (or floating-point) Duration than the
        // clock's native one still compile; coarser durations convert losslessly.
        auto const systemPoint =
                std::chrono::time_point_cast<std::chrono::system_clock::duration>(time_point);
        auto const converted = std::chrono::system_clock::to_time_t(systemPoint);

#ifdef _MSC_VER
        std::tm timeInfo = {};
        // gmtime_s reports failure through its return value.
        if (gmtime_s(&timeInfo, &converted) != 0) {
            return "{time point cannot be converted to UTC calendar time}";
        }
        std::tm const *const utc = &timeInfo;
#else
        // std::gmtime returns a null pointer on failure.
        std::tm const *const utc = std::gmtime(&converted);
        if (utc == nullptr) {
            return "{time point cannot be converted to UTC calendar time}";
        }
#endif

        auto const timeStampSize = sizeof("2017-01-16T17:06:45Z");
        char timeStamp[timeStampSize];
        const char *const fmt = "%Y-%m-%dT%H:%M:%SZ";

        // strftime returns 0 when the result does not fit (for example years
        // with more than four digits); the buffer contents are then unspecified.
        std::size_t const written = std::strftime(timeStamp, timeStampSize, fmt, utc);
        if (written == 0) {
            return "{time point does not fit the timestamp format}";
        }
        return std::string(timeStamp, written);
    }
};
}  // namespace Catch
#endif  // CATCH_CONFIG_ENABLE_CHRONO_STRINGMAKER

// Generates a StringMaker specialization for `enumName`.
// On the first conversion the enum is registered with the mutable enum-values
// registry, passing the stringified enum name, the stringified enumerator
// list and the enumerators themselves. Each conversion then looks the value up
// by its int representation.
#define INTERNAL_CATCH_REGISTER_ENUM(enumName, ...)                                               \
    namespace Catch {                                                                             \
    template <>                                                                                   \
    struct StringMaker<enumName> {                                                                \
        static std::string convert(enumName value) {                                              \
            static const auto &enumInfo =                                                         \
                    ::Catch::getMutableRegistryHub().getMutableEnumValuesRegistry().registerEnum( \
                            #enumName, #__VA_ARGS__, {__VA_ARGS__});                              \
            return static_cast<std::string>(enumInfo.lookup(static_cast<int>(value)));            \
        }                                                                                         \
    };                                                                                            \
    }

// Public spelling of the macro above.
#define CATCH_REGISTER_ENUM(enumName, ...) INTERNAL_CATCH_REGISTER_ENUM(enumName, __VA_ARGS__)

#ifdef _MSC_VER
#pragma warning(pop)
#endif

// end catch_tostring.h
#include <iosfwd>

#ifdef _MSC_VER
#pragma warning(push)
#pragma warning(disable : 4389)  // '==' : signed/unsigned mismatch
#pragma warning(disable : 4018)  // more "signed/unsigned mismatch"
#pragma warning(disable : 4312)  // Converting int to T* using reinterpret_cast \
                                 // (issue on x64 platform)
#pragma warning(disable : 4180)  // qualifier applied to function type has no meaning
#pragma warning(disable : 4800)  // Forcing result to true or false
#endif

namespace Catch {

// Base class of the expression objects produced while decomposing an
// assertion. It stores whether the expression was binary and its boolean
// result; derived classes know how to print the expanded expression.
struct ITransientExpression {
    bool isBinaryExpression() const { return m_isBinaryExpression; }
    bool getResult() const { return m_result; }

    // Writes the expression with its operands expanded to `os`.
    virtual void streamReconstructedExpression(std::ostream &os) const = 0;

    ITransientExpression(bool isBinaryExpression, bool result)
            : m_isBinaryExpression(isBinaryExpression), m_result(result) {}

    // We don't actually need a virtual destructor, but many static analysers
    // complain if it's not here :-(
    virtual ~ITransientExpression();

    bool m_isBinaryExpression;
    bool m_result;
};

// Writes the already stringified operands `lhs` and `rhs` around operator
// `op` to `os`; defined elsewhere.
void formatReconstructedExpression(std::ostream &os,
                                   std::string const &lhs,
                                   StringRef op,
                                   std::string const &rhs);

// A fully decomposed binary comparison: both operands, the operator text and
// the already computed result. Applying any further operator to it is a
// compile-time error, because chained comparisons cannot be decomposed.
template <typename LhsT, typename RhsT>
class BinaryExpr : public ITransientExpression {
    LhsT m_lhs;
    StringRef m_op;
    RhsT m_rhs;

    void streamReconstructedExpression(std::ostream &os) const override {
        formatReconstructedExpression(os, Catch::Detail::stringify(m_lhs), m_op,
                                      Catch::Detail::stringify(m_rhs));
    }

public:
    BinaryExpr(bool comparisonResult, LhsT lhs, StringRef op, RhsT rhs)
            : ITransientExpression{true, comparisonResult}, m_lhs(lhs), m_op(op), m_rhs(rhs) {}

    // Every operator below exists only to turn a chained comparison into a
    // readable static_assert failure; none of them can be instantiated.

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator&&(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator||(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator==(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator!=(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator>(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator<(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator>=(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename T>
    BinaryExpr<LhsT, RhsT const &> const operator<=(T) const {
        static_assert(always_false<T>::value,
                      "chained comparisons are not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }
};

// An assertion expression consisting of a single operand; its result is the
// operand converted to bool.
template <typename LhsT>
class UnaryExpr : public ITransientExpression {
    LhsT m_lhs;

    void streamReconstructedExpression(std::ostream &os) const override {
        std::string const rendered = Catch::Detail::stringify(m_lhs);
        os << rendered;
    }

public:
    explicit UnaryExpr(LhsT lhs)
            : ITransientExpression{false, static_cast<bool>(lhs)}, m_lhs(lhs) {}
};

// Equality helpers used by the expression decomposer.
// The generic overload forwards to operator==. The pointer/integer overloads
// handle comparisons between ints and pointers (NULL deduces as an int) by
// converting the integer operand to a pointer first.
template <typename LhsT, typename RhsT>
bool compareEqual(LhsT const &lhs, RhsT const &rhs) {
    return static_cast<bool>(lhs == rhs);
}

// pointer == integer
template <typename T>
bool compareEqual(T *const &lhs, int rhs) {
    return lhs == reinterpret_cast<void const *>(rhs);
}
template <typename T>
bool compareEqual(T *const &lhs, long rhs) {
    return lhs == reinterpret_cast<void const *>(rhs);
}

// integer == pointer
template <typename T>
bool compareEqual(int lhs, T *const &rhs) {
    return reinterpret_cast<void const *>(lhs) == rhs;
}
template <typename T>
bool compareEqual(long lhs, T *const &rhs) {
    return reinterpret_cast<void const *>(lhs) == rhs;
}

template <typename LhsT, typename RhsT>
auto compareNotEqual(LhsT const &lhs, RhsT &&rhs) -> bool {
    return static_cast<bool>(lhs != rhs);
}
template <typename T>
auto compareNotEqual(T *const &lhs, int rhs) -> bool {
    return lhs != reinterpret_cast<void const *>(rhs);
}
template <typename T>
auto compareNotEqual(T *const &lhs, long rhs) -> bool {
    return lhs != reinterpret_cast<void const *>(rhs);
}
template <typename T>
auto compareNotEqual(int lhs, T *const &rhs) -> bool {
    return reinterpret_cast<void const *>(lhs) != rhs;
}
template <typename T>
auto compareNotEqual(long lhs, T *const &rhs) -> bool {
    return reinterpret_cast<void const *>(lhs) != rhs;
}

// Holds the left-hand operand captured by Decomposer. Applying a comparison
// or bitwise operator yields a BinaryExpr that carries the evaluated result
// together with both operands and the operator text. Logical && and || are
// rejected at compile time.
template <typename LhsT>
class ExprLhs {
    LhsT m_lhs;

public:
    explicit ExprLhs(LhsT lhs) : m_lhs(lhs) {}

    // Equality / inequality: generic right-hand sides go through the
    // compareEqual / compareNotEqual helpers, bool right-hand sides are
    // compared directly and stored by value.
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator==(RhsT const &rhs) {
        return {compareEqual(m_lhs, rhs), m_lhs, "==", rhs};
    }
    BinaryExpr<LhsT, bool> const operator==(bool rhs) {
        return {m_lhs == rhs, m_lhs, "==", rhs};
    }

    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator!=(RhsT const &rhs) {
        return {compareNotEqual(m_lhs, rhs), m_lhs, "!=", rhs};
    }
    BinaryExpr<LhsT, bool> const operator!=(bool rhs) {
        return {m_lhs != rhs, m_lhs, "!=", rhs};
    }

    // Relational operators.
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator>(RhsT const &rhs) {
        return {static_cast<bool>(m_lhs > rhs), m_lhs, ">", rhs};
    }
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator<(RhsT const &rhs) {
        return {static_cast<bool>(m_lhs < rhs), m_lhs, "<", rhs};
    }
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator>=(RhsT const &rhs) {
        return {static_cast<bool>(m_lhs >= rhs), m_lhs, ">=", rhs};
    }
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator<=(RhsT const &rhs) {
        return {static_cast<bool>(m_lhs <= rhs), m_lhs, "<=", rhs};
    }

    // Bitwise operators; the result of the operation is converted to bool.
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator|(RhsT const &rhs) {
        return {static_cast<bool>(m_lhs | rhs), m_lhs, "|", rhs};
    }
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator&(RhsT const &rhs) {
        return {static_cast<bool>(m_lhs & rhs), m_lhs, "&", rhs};
    }
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator^(RhsT const &rhs) {
        return {static_cast<bool>(m_lhs ^ rhs), m_lhs, "^", rhs};
    }

    // Logical operators cannot be decomposed; instantiating them fails with
    // an explanatory message.
    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator&&(RhsT const &) {
        static_assert(always_false<RhsT>::value,
                      "operator&& is not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    template <typename RhsT>
    BinaryExpr<LhsT, RhsT const &> const operator||(RhsT const &) {
        static_assert(always_false<RhsT>::value,
                      "operator|| is not supported inside assertions, "
                      "wrap the expression inside parentheses, or decompose it");
    }

    // Used when no operator followed the operand: wraps it as a unary expression.
    UnaryExpr<LhsT> makeUnaryExpr() const { return UnaryExpr<LhsT>{m_lhs}; }
};

// Processes a decomposed expression; defined elsewhere.
void handleExpression(ITransientExpression const &expr);

// A bare left-hand side (no operator applied) is handled as a unary expression.
template <typename T>
void handleExpression(ExprLhs<T> const &expr) {
    // Binding to the base-class reference keeps the temporary alive for the call.
    ITransientExpression const &unary = expr.makeUnaryExpr();
    handleExpression(unary);
}

// Entry point of expression decomposition: `Decomposer() <= value` captures
// `value` as the left-hand side of the expression that follows.
struct Decomposer {
    // Generic operands are captured by const reference.
    template <typename T>
    ExprLhs<T const &> operator<=(T const &lhs) {
        return ExprLhs<T const &>{lhs};
    }

    // bool operands are captured by value.
    ExprLhs<bool> operator<=(bool value) {
        return ExprLhs<bool>{value};
    }
};

}  // end namespace Catch

#ifdef _MSC_VER
#pragma warning(pop)
#endif

// end catch_decomposer.h
// start catch_interfaces_capture.h

#include <chrono>
#include <string>

namespace Catch {

// Forward declarations of the types that the interface below only uses by
// reference or pointer.
class AssertionResult;
struct AssertionInfo;
struct SectionInfo;
struct SectionEndInfo;
struct MessageInfo;
struct MessageBuilder;
struct Counts;
struct AssertionReaction;
struct SourceLineInfo;

struct ITransientExpression;
struct IGeneratorTracker;

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
struct BenchmarkInfo;
template <typename Duration = std::chrono::duration<double, std::nano>>
struct BenchmarkStats;
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// Abstract interface through which sections, generators, benchmarks, messages
// and assertion outcomes are reported. Every member is pure virtual; the
// concrete behaviour lives in the implementing class, which is not part of
// this section.
struct IResultCapture {
    virtual ~IResultCapture();

    // Section lifecycle notifications.
    virtual bool sectionStarted(SectionInfo const &sectionInfo, Counts &assertions) = 0;
    virtual void sectionEnded(SectionEndInfo const &endInfo) = 0;
    virtual void sectionEndedEarly(SectionEndInfo const &endInfo) = 0;

    // Returns the tracker for the generator identified by name and source location.
    virtual auto acquireGeneratorTracker(StringRef generatorName, SourceLineInfo const &lineInfo)
            -> IGeneratorTracker & = 0;

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
    // Benchmark lifecycle notifications (only with benchmarking enabled).
    virtual void benchmarkPreparing(std::string const &name) = 0;
    virtual void benchmarkStarting(BenchmarkInfo const &info) = 0;
    virtual void benchmarkEnded(BenchmarkStats<> const &stats) = 0;
    virtual void benchmarkFailed(std::string const &error) = 0;
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

    // Message handling.
    virtual void pushScopedMessage(MessageInfo const &message) = 0;
    virtual void popScopedMessage(MessageInfo const &message) = 0;

    virtual void emplaceUnscopedMessage(MessageBuilder const &builder) = 0;

    virtual void handleFatalErrorCondition(StringRef message) = 0;

    // Assertion outcome handlers. Those taking an AssertionReaction receive it
    // by non-const reference.
    // NOTE(review): presumably the implementation fills it in to tell the
    // caller how to react - confirm.
    virtual void handleExpr(AssertionInfo const &info,
                            ITransientExpression const &expr,
                            AssertionReaction &reaction) = 0;
    virtual void handleMessage(AssertionInfo const &info,
                               ResultWas::OfType resultType,
                               StringRef const &message,
                               AssertionReaction &reaction) = 0;
    virtual void handleUnexpectedExceptionNotThrown(AssertionInfo const &info,
                                                    AssertionReaction &reaction) = 0;
    virtual void handleUnexpectedInflightException(AssertionInfo const &info,
                                                   std::string const &message,
                                                   AssertionReaction &reaction) = 0;
    virtual void handleIncomplete(AssertionInfo const &info) = 0;
    virtual void handleNonExpr(AssertionInfo const &info,
                               ResultWas::OfType resultType,
                               AssertionReaction &reaction) = 0;

    virtual bool lastAssertionPassed() = 0;
    virtual void assertionPassed() = 0;

    // Deprecated, do not use:
    virtual std::string getCurrentTestName() const = 0;
    virtual const AssertionResult *getLastResult() const = 0;
    virtual void exceptionEarlyReported() = 0;
};

// Accessor for the active result capture; defined elsewhere.
IResultCapture &getResultCapture();
}  // namespace Catch

// end catch_interfaces_capture.h
namespace Catch {

// Empty tag type. NOTE(review): presumably thrown to abort the current test
// after a failed assertion - confirm against the AssertionHandler definition.
struct TestFailureException {};
struct AssertionResultData;
struct IResultCapture;
class RunContext;

// Holds a non-owning pointer to a transient expression together with a
// negation flag; it can be tested as a bool and streamed. The pointer is only
// reachable by the befriended AssertionHandler, AssertionStats and RunContext.
class LazyExpression {
    friend class AssertionHandler;
    friend struct AssertionStats;
    friend class RunContext;

    // Null until one of the friend classes assigns an expression.
    ITransientExpression const *m_transientExpression = nullptr;
    bool m_isNegated;

public:
    LazyExpression(bool isNegated);
    LazyExpression(LazyExpression const &other);
    // Copy-constructible but not assignable.
    LazyExpression &operator=(LazyExpression const &) = delete;

    explicit operator bool() const;

    friend auto operator<<(std::ostream &os, LazyExpression const &lazyExpr) -> std::ostream &;
};

// Flags filled in by the IResultCapture::handle* calls to tell the assertion
// handler what to do once the result has been recorded. Both default to false.
struct AssertionReaction {
    bool shouldDebugBreak = false;
    bool shouldThrow = false;
};

// Handles one assertion on behalf of the INTERNAL_CATCH_* macros: each macro
// creates a local handler, calls exactly one of the handle* members depending
// on what happened, and finishes with complete() (via INTERNAL_CATCH_REACT).
class AssertionHandler {
    AssertionInfo m_assertionInfo;
    AssertionReaction m_reaction;
    bool m_completed = false;
    IResultCapture &m_resultCapture;

public:
    AssertionHandler(StringRef const &macroName,
                     SourceLineInfo const &lineInfo,
                     StringRef capturedExpression,
                     ResultDisposition::Flags resultDisposition);

    // A handler destroyed without having been completed is reported to the
    // result capture as an incomplete assertion.
    ~AssertionHandler() {
        if (m_completed) {
            return;
        }
        m_resultCapture.handleIncomplete(m_assertionInfo);
    }

    // Reports a fully decomposed expression.
    void handleExpr(ITransientExpression const &expr);

    // Reports a bare left-hand side by first turning it into a unary
    // expression and then delegating to the overload above.
    template <typename LhsT>
    void handleExpr(ExprLhs<LhsT> const &expr) {
        auto const &unaryExpr = expr.makeUnaryExpr();
        handleExpr(unaryExpr);
    }

    void handleMessage(ResultWas::OfType resultType, StringRef const &message);

    // Outcome notifications used by the *_THROWS* / *_NO_THROW macros.
    void handleExceptionThrownAsExpected();
    void handleUnexpectedExceptionNotThrown();
    void handleExceptionNotThrownAsExpected();
    void handleThrowingCallSkipped();
    void handleUnexpectedInflightException();

    void complete();
    void setCompleted();

    // query
    auto allowThrows() const -> bool;
};

// Invoked from the catch(...) branch of INTERNAL_CATCH_THROWS_STR_MATCHES with
// the expected string `str` and the stringified matcher expression.
// NOTE(review): presumably matches the in-flight exception's message against
// `str` - the definition is not visible here.
void handleExceptionMatchExpr(AssertionHandler &handler,
                              std::string const &str,
                              StringRef const &matcherString);

}  // namespace Catch

// end catch_assertionhandler.h
// start catch_message.h

#include <string>
#include <vector>

namespace Catch {

// Plain record describing one user message: the macro that produced it, the
// message text, its source location and result type, plus a sequence number.
struct MessageInfo {
    MessageInfo(StringRef const &_macroName,
                SourceLineInfo const &_lineInfo,
                ResultWas::OfType _type);

    StringRef macroName;
    std::string message;  // not a constructor argument; filled in afterwards
    SourceLineInfo lineInfo;
    ResultWas::OfType type;
    // NOTE(review): presumably assigned from globalCount in the constructor
    // and used by operator== / operator< - definitions are out of line.
    unsigned int sequence;

    bool operator==(MessageInfo const &other) const;
    bool operator<(MessageInfo const &other) const;

private:
    static unsigned int globalCount;
};

// Minimal stream wrapper: collects everything inserted with << into m_stream.
struct MessageStream {
    ReusableStringStream m_stream;

    // Appends `value` to the underlying stream and returns *this for chaining.
    template <typename ValueT>
    auto operator<<(ValueT const &value) -> MessageStream & {
        m_stream << value;
        return *this;
    }
};

struct MessageBuilder : MessageStream {
    MessageBuilder(StringRef const &macroName,
                   SourceLineInfo const &lineInfo,
                   ResultWas::OfType type);

    template <typename T>
    MessageBuilder &operator<<(T const &value) {
        m_stream << value;
        return *this;
    }

    MessageInfo m_info;
};

// Message object created by INTERNAL_CATCH_INFO as a local variable.
// Movable but not copyable.
// NOTE(review): presumably pushes the message on construction and pops it on
// destruction via IResultCapture - the definitions are out of line.
class ScopedMessage {
public:
    explicit ScopedMessage(MessageBuilder const &builder);
    ScopedMessage(ScopedMessage &duplicate) = delete;
    ScopedMessage(ScopedMessage &&old);
    ~ScopedMessage();

    MessageInfo m_info;
    // NOTE(review): presumably set on the moved-from object so that its
    // destructor skips the pop - confirm in the definition.
    bool m_moved;
};

// Backs INTERNAL_CATCH_CAPTURE: constructed with the comma-separated names of
// the captured expressions, then fed their values one by one through
// captureValues(0, ...).
class Capturer {
    std::vector<MessageInfo> m_messages;
    IResultCapture &m_resultCapture = getResultCapture();
    size_t m_captured = 0;

public:
    Capturer(StringRef macroName,
             SourceLineInfo const &lineInfo,
             ResultWas::OfType resultType,
             StringRef names);
    ~Capturer();

    // Records the already-stringified value for the capture at `index`.
    void captureValue(size_t index, std::string const &value);

    // Single value: stringify it and record it at `index`.
    template <typename T>
    void captureValues(size_t index, T const &value) {
        std::string const rendered = Catch::Detail::stringify(value);
        captureValue(index, rendered);
    }

    // Several values: record the first at `index`, then continue with the
    // remaining ones at the following indices.
    template <typename T, typename... Ts>
    void captureValues(size_t index, T const &value, Ts const &...values) {
        captureValues(index, value);
        captureValues(index + 1, values...);
    }
};

}  // end namespace Catch

// end catch_message.h
#if !defined(CATCH_CONFIG_DISABLE)

// CATCH_INTERNAL_STRINGIFY turns the asserted expression into a string literal
// for reporting. When CATCH_CONFIG_DISABLE_STRINGIFICATION is defined it
// yields a fixed placeholder string instead of the expression text.
#if !defined(CATCH_CONFIG_DISABLE_STRINGIFICATION)
#define CATCH_INTERNAL_STRINGIFY(...) #__VA_ARGS__
#else
#define CATCH_INTERNAL_STRINGIFY(...) "Disabled by CATCH_CONFIG_DISABLE_STRINGIFICATION"
#endif

#if !defined(CATCH_CONFIG_FAST_COMPILE) && !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)

///////////////////////////////////////////////////////////////////////////////
// Default build: the asserted expression is wrapped in a local try/catch, and
// any exception escaping it is reported through the assertion handler.
#define INTERNAL_CATCH_TRY try
#define INTERNAL_CATCH_CATCH(handler)                \
    catch (...) {                                    \
        handler.handleUnexpectedInflightException(); \
    }

#else  // CATCH_CONFIG_FAST_COMPILE || CATCH_CONFIG_DISABLE_EXCEPTIONS

// Fast-compile or exception-free build: both macros expand to nothing, so the
// REQUIRE* family gets no local try/catch (this also speeds up compilation).
#define INTERNAL_CATCH_TRY
#define INTERNAL_CATCH_CATCH(handler)

#endif

// Final step of every assertion macro: completes the handler. The expansion
// already ends in ';', so call sites use it without one.
#define INTERNAL_CATCH_REACT(handler) handler.complete();

///////////////////////////////////////////////////////////////////////////////
// Core boolean assertion. Creates a local AssertionHandler, decomposes the
// expression with `Catch::Decomposer() <= expr` inside INTERNAL_CATCH_TRY /
// INTERNAL_CATCH_CATCH, then completes the handler.
// The trailing `while` condition always short-circuits on `(false)`, so the
// expression is not evaluated a second time there; it only has to compile as
// something convertible to bool.
#define INTERNAL_CATCH_TEST(macroName, resultDisposition, ...)                    \
    do {                                                                          \
        CATCH_INTERNAL_IGNORE_BUT_WARN(__VA_ARGS__);                              \
        Catch::AssertionHandler catchAssertionHandler(                            \
                macroName##_catch_sr, CATCH_INTERNAL_LINEINFO,                    \
                CATCH_INTERNAL_STRINGIFY(__VA_ARGS__), resultDisposition);        \
        INTERNAL_CATCH_TRY {                                                      \
            CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                             \
            CATCH_INTERNAL_SUPPRESS_PARENTHESES_WARNINGS                          \
            catchAssertionHandler.handleExpr(Catch::Decomposer() <= __VA_ARGS__); \
            CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                              \
        }                                                                         \
        INTERNAL_CATCH_CATCH(catchAssertionHandler)                               \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                               \
    } while ((void)0, (false) && static_cast<bool>(!!(__VA_ARGS__)))

///////////////////////////////////////////////////////////////////////////////
// Runs the assertion, then opens an `if` that is taken when it passed.
// Expands to TWO statements (the assertion, then the `if`), so it must not be
// used as the unbraced body of another control statement.
#define INTERNAL_CATCH_IF(macroName, resultDisposition, ...)        \
    INTERNAL_CATCH_TEST(macroName, resultDisposition, __VA_ARGS__); \
    if (Catch::getResultCapture().lastAssertionPassed())

///////////////////////////////////////////////////////////////////////////////
// Runs the assertion, then opens an `if` that is taken when it did NOT pass.
// Expands to TWO statements (the assertion, then the `if`), so it must not be
// used as the unbraced body of another control statement.
#define INTERNAL_CATCH_ELSE(macroName, resultDisposition, ...)      \
    INTERNAL_CATCH_TEST(macroName, resultDisposition, __VA_ARGS__); \
    if (!Catch::getResultCapture().lastAssertionPassed())

///////////////////////////////////////////////////////////////////////////////
// Asserts that evaluating the expression does not throw. The result of the
// expression is discarded; any exception is reported as an unexpected
// in-flight exception. Always uses a real try/catch, regardless of
// INTERNAL_CATCH_TRY.
#define INTERNAL_CATCH_NO_THROW(macroName, resultDisposition, ...)         \
    do {                                                                   \
        Catch::AssertionHandler catchAssertionHandler(                     \
                macroName##_catch_sr, CATCH_INTERNAL_LINEINFO,             \
                CATCH_INTERNAL_STRINGIFY(__VA_ARGS__), resultDisposition); \
        try {                                                              \
            static_cast<void>(__VA_ARGS__);                                \
            catchAssertionHandler.handleExceptionNotThrownAsExpected();    \
        } catch (...) {                                                    \
            catchAssertionHandler.handleUnexpectedInflightException();     \
        }                                                                  \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                        \
    } while (false)

///////////////////////////////////////////////////////////////////////////////
// Asserts that evaluating the expression throws an exception of any type.
// The expression is only evaluated when the handler's allowThrows() is true;
// otherwise the call is reported as skipped.
#define INTERNAL_CATCH_THROWS(macroName, resultDisposition, ...)            \
    do {                                                                    \
        Catch::AssertionHandler catchAssertionHandler(                      \
                macroName##_catch_sr, CATCH_INTERNAL_LINEINFO,              \
                CATCH_INTERNAL_STRINGIFY(__VA_ARGS__), resultDisposition);  \
        if (catchAssertionHandler.allowThrows())                            \
            try {                                                           \
                static_cast<void>(__VA_ARGS__);                             \
                catchAssertionHandler.handleUnexpectedExceptionNotThrown(); \
            } catch (...) {                                                 \
                catchAssertionHandler.handleExceptionThrownAsExpected();    \
            }                                                               \
        else                                                                \
            catchAssertionHandler.handleThrowingCallSkipped();              \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                         \
    } while (false)

///////////////////////////////////////////////////////////////////////////////
// Asserts that evaluating `expr` throws something catchable as
// `exceptionType const &`. Any other exception is reported as an unexpected
// in-flight exception; no exception at all is reported as "not thrown".
// The captured text is "<expr>, <exceptionType>". `expr` is only evaluated
// when the handler's allowThrows() is true.
#define INTERNAL_CATCH_THROWS_AS(macroName, exceptionType, resultDisposition, expr)          \
    do {                                                                                     \
        Catch::AssertionHandler catchAssertionHandler(                                       \
                macroName##_catch_sr, CATCH_INTERNAL_LINEINFO,                               \
                CATCH_INTERNAL_STRINGIFY(expr) ", " CATCH_INTERNAL_STRINGIFY(exceptionType), \
                resultDisposition);                                                          \
        if (catchAssertionHandler.allowThrows())                                             \
            try {                                                                            \
                static_cast<void>(expr);                                                     \
                catchAssertionHandler.handleUnexpectedExceptionNotThrown();                  \
            } catch (exceptionType const &) {                                                \
                catchAssertionHandler.handleExceptionThrownAsExpected();                     \
            } catch (...) {                                                                  \
                catchAssertionHandler.handleUnexpectedInflightException();                   \
            }                                                                                \
        else                                                                                 \
            catchAssertionHandler.handleThrowingCallSkipped();                               \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                                          \
    } while (false)

///////////////////////////////////////////////////////////////////////////////
// Reports a message-only result of type `messageType`. The variadic arguments
// are streamed into a temporary MessageStream and the resulting string is
// passed to handleMessage; no expression text is captured (empty StringRef).
// NOTE(review): the trailing `+ ::Catch::StreamEndStop()` presumably keeps the
// expression well-formed when no message arguments are given (it then reads
// as a unary plus) - confirm against StreamEndStop's definition.
#define INTERNAL_CATCH_MSG(macroName, messageType, resultDisposition, ...)                         \
    do {                                                                                           \
        Catch::AssertionHandler catchAssertionHandler(macroName##_catch_sr,                        \
                                                      CATCH_INTERNAL_LINEINFO, Catch::StringRef(), \
                                                      resultDisposition);                          \
        catchAssertionHandler.handleMessage(                                                       \
                messageType, (Catch::MessageStream() << __VA_ARGS__ + ::Catch::StreamEndStop())    \
                                     .m_stream.str());                                             \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                                                \
    } while (false)

///////////////////////////////////////////////////////////////////////////////
// Declares a local Capturer named `varName`, constructed with the stringified
// argument list, and passes the argument values to captureValues starting at
// index 0. Expands to two statements; the caller supplies the final ';'.
// Unlike the assertion macros, `macroName` is passed through as-is (no
// `_catch_sr` suffix is pasted on).
#define INTERNAL_CATCH_CAPTURE(varName, macroName, ...)                                        \
    auto varName = Catch::Capturer(macroName, CATCH_INTERNAL_LINEINFO, Catch::ResultWas::Info, \
                                   #__VA_ARGS__);                                              \
    varName.captureValues(0, __VA_ARGS__)

///////////////////////////////////////////////////////////////////////////////
// Declares a uniquely named local ScopedMessage built from `log`, which is
// streamed into a MessageBuilder of type ResultWas::Info. The message object
// lives until the end of the enclosing scope.
// Note: the expansion already ends in ';'.
#define INTERNAL_CATCH_INFO(macroName, log)                                      \
    Catch::ScopedMessage INTERNAL_CATCH_UNIQUE_NAME(scopedMessage)(              \
            Catch::MessageBuilder(macroName##_catch_sr, CATCH_INTERNAL_LINEINFO, \
                                  Catch::ResultWas::Info)                        \
            << log);

///////////////////////////////////////////////////////////////////////////////
// Builds an Info message from `log` and hands it straight to the result
// capture via emplaceUnscopedMessage; no local object is declared, so the
// message is not tied to the enclosing C++ scope. The caller supplies the ';'.
#define INTERNAL_CATCH_UNSCOPED_INFO(macroName, log)                             \
    Catch::getResultCapture().emplaceUnscopedMessage(                            \
            Catch::MessageBuilder(macroName##_catch_sr, CATCH_INTERNAL_LINEINFO, \
                                  Catch::ResultWas::Info)                        \
            << log)

///////////////////////////////////////////////////////////////////////////////
// Asserts that evaluating the expression throws, then delegates to
// handleExceptionMatchExpr with `matcher` and its stringified spelling.
// Although this is matcher-based, it can be used with just a string.
// The captured text is "<expression>, <matcher>". The expression is only
// evaluated when the handler's allowThrows() is true.
#define INTERNAL_CATCH_THROWS_STR_MATCHES(macroName, resultDisposition, matcher, ...)         \
    do {                                                                                      \
        Catch::AssertionHandler catchAssertionHandler(                                        \
                macroName##_catch_sr, CATCH_INTERNAL_LINEINFO,                                \
                CATCH_INTERNAL_STRINGIFY(__VA_ARGS__) ", " CATCH_INTERNAL_STRINGIFY(matcher), \
                resultDisposition);                                                           \
        if (catchAssertionHandler.allowThrows())                                              \
            try {                                                                             \
                static_cast<void>(__VA_ARGS__);                                               \
                catchAssertionHandler.handleUnexpectedExceptionNotThrown();                   \
            } catch (...) {                                                                   \
                Catch::handleExceptionMatchExpr(catchAssertionHandler, matcher,               \
                                                #matcher##_catch_sr);                         \
            }                                                                                 \
        else                                                                                  \
            catchAssertionHandler.handleThrowingCallSkipped();                                \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                                           \
    } while (false)

#endif  // CATCH_CONFIG_DISABLE

// end catch_capture.hpp
// start catch_section.h

// start catch_section_info.h

// start catch_totals.h

#include <cstddef>

namespace Catch {

// Tally of outcomes in three buckets: passed, failed, and failed-but-ok.
// All counters start at zero.
struct Counts {
    Counts operator-(Counts const &other) const;
    Counts &operator+=(Counts const &other);

    std::size_t total() const;
    bool allPassed() const;
    bool allOk() const;

    std::size_t passed = 0;
    std::size_t failed = 0;
    std::size_t failedButOk = 0;
};

// Aggregate of two Counts (one for assertions, one for test cases) plus an
// integer error field.
struct Totals {
    Totals operator-(Totals const &other) const;
    Totals &operator+=(Totals const &other);

    // NOTE(review): presumably the change relative to `prevTotals`; the
    // definition is out of line.
    Totals delta(Totals const &prevTotals) const;

    int error = 0;
    Counts assertions;
    Counts testCases;
};
}  // namespace Catch

// end catch_totals.h
#include <string>

namespace Catch {

// Identifies a section by name and source location.
struct SectionInfo {
    SectionInfo(SourceLineInfo const &_lineInfo, std::string const &_name);

    // Deprecated
    // The third (description) argument is ignored; this simply delegates to
    // the two-argument constructor.
    SectionInfo(SourceLineInfo const &_lineInfo, std::string const &_name, std::string const &)
            : SectionInfo(_lineInfo, _name) {}

    std::string name;
    std::string description;  // !Deprecated: this will always be empty
    SourceLineInfo lineInfo;
};

// Payload passed to IResultCapture::sectionEnded / sectionEndedEarly: the
// section's identity, a Counts snapshot, and the section's duration in
// seconds.
struct SectionEndInfo {
    SectionInfo sectionInfo;
    // NOTE(review): presumably the assertion counts recorded before the
    // section started - confirm against Section's definition.
    Counts prevAssertions;
    double durationInSeconds;
};

}  // end namespace Catch

// end catch_section_info.h
// start catch_timer.h

#include <cstdint>

namespace Catch {

// Clock helpers; both return a value in nanoseconds as uint64_t.
auto getCurrentNanosecondsSinceEpoch() -> uint64_t;
auto getEstimatedClockResolution() -> uint64_t;

// Simple stopwatch: call start(), then query the elapsed time in the unit of
// choice. Note the differing return types of the accessors.
class Timer {
    // NOTE(review): presumably the timestamp captured by start(); 0 until
    // start() has been called.
    uint64_t m_nanoseconds = 0;

public:
    void start();
    auto getElapsedNanoseconds() const -> uint64_t;
    auto getElapsedMicroseconds() const -> uint64_t;
    auto getElapsedMilliseconds() const -> unsigned int;
    auto getElapsedSeconds() const -> double;
};

}  // namespace Catch

// end catch_timer.h
#include <string>

namespace Catch {

// Object created by INTERNAL_CATCH_SECTION / INTERNAL_CATCH_DYNAMIC_SECTION
// for the duration of a section body. Implicitly constructible from a
// SectionInfo and non-copyable.
class Section : NonCopyable {
public:
    Section(SectionInfo const &info);
    ~Section();

    // This indicates whether the section should be executed or not
    explicit operator bool() const;

private:
    SectionInfo m_info;

    std::string m_name;
    Counts m_assertions;
    bool m_sectionIncluded;
    Timer m_timer;
};

}  // end namespace Catch

// Opens a section: expands to an `if` whose condition declares a uniquely
// named `Section const &` bound to a temporary built from a SectionInfo. The
// statement following the macro is the section body; it runs only when the
// Section converts to true.
#define INTERNAL_CATCH_SECTION(...)                                                \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                      \
    CATCH_INTERNAL_SUPPRESS_UNUSED_WARNINGS                                        \
    if (Catch::Section const &INTERNAL_CATCH_UNIQUE_NAME(catch_internal_Section) = \
                Catch::SectionInfo(CATCH_INTERNAL_LINEINFO, __VA_ARGS__))          \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION

// Same as INTERNAL_CATCH_SECTION, except that the section name is produced at
// run time by streaming the arguments into a ReusableStringStream.
#define INTERNAL_CATCH_DYNAMIC_SECTION(...)                                               \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                             \
    CATCH_INTERNAL_SUPPRESS_UNUSED_WARNINGS                                               \
    if (Catch::Section const &INTERNAL_CATCH_UNIQUE_NAME(catch_internal_Section) =        \
                Catch::SectionInfo(CATCH_INTERNAL_LINEINFO,                               \
                                   (Catch::ReusableStringStream() << __VA_ARGS__).str())) \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION

// end catch_section.h
// start catch_interfaces_exception.h

// start catch_interfaces_registry_hub.h

#include <memory>
#include <string>

namespace Catch {

class TestCase;
struct ITestCaseRegistry;
struct IExceptionTranslatorRegistry;
struct IExceptionTranslator;
struct IReporterRegistry;
struct IReporterFactory;
struct ITagAliasRegistry;
struct IMutableEnumValuesRegistry;

class StartupExceptionRegistry;

using IReporterFactoryPtr = std::shared_ptr<IReporterFactory>;

// Read-only view of the registries: every accessor is const and returns a
// const reference. Obtained through getRegistryHub().
struct IRegistryHub {
    virtual ~IRegistryHub();

    virtual IReporterRegistry const &getReporterRegistry() const = 0;
    virtual ITestCaseRegistry const &getTestCaseRegistry() const = 0;
    virtual ITagAliasRegistry const &getTagAliasRegistry() const = 0;
    virtual IExceptionTranslatorRegistry const &getExceptionTranslatorRegistry() const = 0;

    virtual StartupExceptionRegistry const &getStartupExceptionRegistry() const = 0;
};

// Registration side of the registries. Obtained through
// getMutableRegistryHub().
struct IMutableRegistryHub {
    virtual ~IMutableRegistryHub();
    virtual void registerReporter(std::string const &name, IReporterFactoryPtr const &factory) = 0;
    virtual void registerListener(IReporterFactoryPtr const &factory) = 0;
    virtual void registerTest(TestCase const &testInfo) = 0;
    // Takes a raw pointer; ExceptionTranslatorRegistrar passes a freshly
    // new-ed translator here. NOTE(review): presumably the registry takes
    // ownership - confirm in the implementation.
    virtual void registerTranslator(const IExceptionTranslator *translator) = 0;
    virtual void registerTagAlias(std::string const &alias,
                                  std::string const &tag,
                                  SourceLineInfo const &lineInfo) = 0;
    // noexcept and argument-free. NOTE(review): presumably records the
    // currently active exception - confirm in the implementation.
    virtual void registerStartupException() noexcept = 0;
    virtual IMutableEnumValuesRegistry &getMutableEnumValuesRegistry() = 0;
};

// Accessors for the read-only and the mutable registry hub, plus two related
// free functions. All four are only declared here.
IRegistryHub const &getRegistryHub();
IMutableRegistryHub &getMutableRegistryHub();
void cleanUp();
// Returns a textual description of the exception currently being handled.
// NOTE(review): presumably forwards to the exception translator registry.
std::string translateActiveException();

}  // namespace Catch

// end catch_interfaces_registry_hub.h
// When Catch is disabled, an exception translator is just a static function
// with the given signature; nothing gets registered.
#if defined(CATCH_CONFIG_DISABLE)
#define INTERNAL_CATCH_TRANSLATE_EXCEPTION_NO_REG(translatorName, signature) \
    static std::string translatorName(signature)
#endif

#include <exception>
#include <string>
#include <vector>

namespace Catch {
// Pointer to a function that takes no arguments and returns a std::string.
using exceptionTranslateFunction = std::string (*)();

struct IExceptionTranslator;
// Ordered collection of owned, immutable translators.
using ExceptionTranslators = std::vector<std::unique_ptr<IExceptionTranslator const>>;

// One link in the translator chain. translate() receives the range of
// translators still to be tried ([it, itEnd)) and returns the text for the
// exception currently being handled.
struct IExceptionTranslator {
    virtual ~IExceptionTranslator();
    virtual std::string translate(ExceptionTranslators::const_iterator it,
                                  ExceptionTranslators::const_iterator itEnd) const = 0;
};

// Registry-side interface: turns the exception currently being handled into
// a string.
struct IExceptionTranslatorRegistry {
    virtual ~IExceptionTranslatorRegistry();

    virtual std::string translateActiveException() const = 0;
};

// Constructing one of these registers a user-supplied translation function
// for exceptions of type T with the mutable registry hub. The
// INTERNAL_CATCH_TRANSLATE_EXCEPTION2 macro creates a namespace-scope instance
// per translator.
class ExceptionTranslatorRegistrar {
    // Adapter that exposes a `std::string (*)(T &)` as an IExceptionTranslator.
    template <typename T>
    class ExceptionTranslator : public IExceptionTranslator {
        using TranslateFn = std::string (*)(T &);

    public:
        ExceptionTranslator(TranslateFn translateFunction)
                : m_translateFunction(translateFunction) {}

        // Gives the remaining translators in [it, itEnd) the first chance; if
        // an exception of type T propagates out of that (or out of the
        // rethrow when there are none left), it is translated here.
        std::string translate(ExceptionTranslators::const_iterator it,
                              ExceptionTranslators::const_iterator itEnd) const override {
#if defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
            return "";
#else
            try {
                if (it != itEnd) {
                    return (*it)->translate(it + 1, itEnd);
                }
                // End of the chain: rethrow the active exception so that the
                // catch clauses of this and the enclosing translators see it.
                std::rethrow_exception(std::current_exception());
            } catch (T &ex) {
                return m_translateFunction(ex);
            }
#endif
        }

    protected:
        TranslateFn m_translateFunction;
    };

public:
    // Wraps `translateFunction` in a heap-allocated adapter and registers it.
    template <typename T>
    ExceptionTranslatorRegistrar(std::string (*translateFunction)(T &)) {
        auto &hub = getMutableRegistryHub();
        hub.registerTranslator(new ExceptionTranslator<T>(translateFunction));
    }
};
}  // namespace Catch

///////////////////////////////////////////////////////////////////////////////
// Declares the static translator function, defines an
// ExceptionTranslatorRegistrar for it in an anonymous namespace (so that it
// registers during static initialization), and ends with the function's
// declarator so that the user-written body that follows becomes its
// definition.
#define INTERNAL_CATCH_TRANSLATE_EXCEPTION2(translatorName, signature) \
    static std::string translatorName(signature);                      \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                          \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                           \
    namespace {                                                        \
    Catch::ExceptionTranslatorRegistrar INTERNAL_CATCH_UNIQUE_NAME(    \
            catch_internal_ExceptionRegistrar)(&translatorName);       \
    }                                                                  \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION                           \
    static std::string translatorName(signature)

// Convenience form of INTERNAL_CATCH_TRANSLATE_EXCEPTION2 that generates a
// unique name for the translator function.
#define INTERNAL_CATCH_TRANSLATE_EXCEPTION(signature) \
    INTERNAL_CATCH_TRANSLATE_EXCEPTION2(              \
            INTERNAL_CATCH_UNIQUE_NAME(catch_internal_ExceptionTranslator), signature)

// end catch_interfaces_exception.h
// start catch_approx.h

#include <type_traits>

namespace Catch {
namespace Detail {

// Target value for approximate floating-point comparison. Any type T from
// which a double can be constructed may be compared against an Approx; the
// operand is converted to double and the equality test itself is performed by
// equalityComparisonImpl (defined out of line).
class Approx {
private:
    bool equalityComparisonImpl(double other) const;
    // Validates the new margin (margin >= 0)
    // out-of-line to avoid including stdexcept in the header
    void setMargin(double margin);
    // Validates the new epsilon (0 < epsilon < 1)
    // out-of-line to avoid including stdexcept in the header
    void setEpsilon(double epsilon);

public:
    explicit Approx(double value);

    static Approx custom();

    Approx operator-() const;

    // Creates a new Approx for `value` that inherits this object's epsilon,
    // margin and scale. Const-qualified because it only reads from *this, so
    // a `const Approx` can serve as a reusable template for new targets.
    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    Approx operator()(T const &value) const {
        Approx approx(static_cast<double>(value));
        approx.m_epsilon = m_epsilon;
        approx.m_margin = m_margin;
        approx.m_scale = m_scale;
        return approx;
    }

    // Converting constructor for any double-constructible type; delegates to
    // Approx(double).
    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    explicit Approx(T const &value) : Approx(static_cast<double>(value)) {}

    // Approximate equality; this is the only comparison that calls
    // equalityComparisonImpl directly, all others are built on top of it.
    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator==(const T &lhs, Approx const &rhs) {
        auto lhs_v = static_cast<double>(lhs);
        return rhs.equalityComparisonImpl(lhs_v);
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator==(Approx const &lhs, const T &rhs) {
        return operator==(rhs, lhs);
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator!=(T const &lhs, Approx const &rhs) {
        return !operator==(lhs, rhs);
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator!=(Approx const &lhs, T const &rhs) {
        return !operator==(rhs, lhs);
    }

    // Ordering comparisons: true when the strict comparison against the exact
    // target value holds OR the two sides are approximately equal.
    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator<=(T const &lhs, Approx const &rhs) {
        return static_cast<double>(lhs) < rhs.m_value || lhs == rhs;
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator<=(Approx const &lhs, T const &rhs) {
        return lhs.m_value < static_cast<double>(rhs) || lhs == rhs;
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator>=(T const &lhs, Approx const &rhs) {
        return static_cast<double>(lhs) > rhs.m_value || lhs == rhs;
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    friend bool operator>=(Approx const &lhs, T const &rhs) {
        return lhs.m_value > static_cast<double>(rhs) || lhs == rhs;
    }

    // Fluent setters; each returns *this so calls can be chained. epsilon()
    // and margin() go through the validating out-of-line setters, scale() is
    // stored without validation.
    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    Approx &epsilon(T const &newEpsilon) {
        double epsilonAsDouble = static_cast<double>(newEpsilon);
        setEpsilon(epsilonAsDouble);
        return *this;
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    Approx &margin(T const &newMargin) {
        double marginAsDouble = static_cast<double>(newMargin);
        setMargin(marginAsDouble);
        return *this;
    }

    template <typename T,
              typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    Approx &scale(T const &newScale) {
        m_scale = static_cast<double>(newScale);
        return *this;
    }

    std::string toString() const;

private:
    // Tolerance settings and the target value. NOTE(review): how epsilon,
    // margin and scale combine is decided in equalityComparisonImpl, which is
    // not visible here.
    double m_epsilon;
    double m_margin;
    double m_scale;
    double m_value;
};
}  // end namespace Detail

// User-defined literal suffix `_a`, which produces an Approx from a
// floating-point or an integer literal.
namespace literals {
Detail::Approx operator"" _a(long double val);
Detail::Approx operator"" _a(unsigned long long val);
}  // end namespace literals

// StringMaker specialization so that an Approx can be converted to a string
// when an assertion is reported.
template <>
struct StringMaker<Catch::Detail::Approx> {
    static std::string convert(Catch::Detail::Approx const &value);
};

}  // end namespace Catch

// end catch_approx.h
// start catch_string_manip.h

#include <iosfwd>
#include <string>
#include <vector>

namespace Catch {

// Prefix / suffix / substring predicates; each has a std::string overload and,
// for the prefix and suffix checks, a single-character overload.
bool startsWith(std::string const &s, std::string const &prefix);
bool startsWith(std::string const &s, char prefix);
bool endsWith(std::string const &s, std::string const &suffix);
bool endsWith(std::string const &s, char suffix);
bool contains(std::string const &s, std::string const &infix);
// Lower-casing: the first modifies its argument, the second returns a copy.
void toLowerInPlace(std::string &s);
std::string toLower(std::string const &s);
//! Returns a new string without whitespace at the start/end
std::string trim(std::string const &str);
//! Returns a substring of the original ref without whitespace. Beware
//! lifetimes!
StringRef trim(StringRef ref);

// !!! Be aware, returns refs into original string - make sure original string
// outlives them
std::vector<StringRef> splitStringRef(StringRef str, char delimiter);
// Replaces `replaceThis` with `withThis` inside `str`.
// NOTE(review): the bool presumably reports whether anything was replaced.
bool replaceInPlace(std::string &str, std::string const &replaceThis, std::string const &withThis);

// Stream helper pairing a count with a label; the actual formatting is done
// by the befriended operator<<, which is defined out of line.
// NOTE(review): presumably prints "<count> <label>" with a plural 's' when
// the count is not 1 - confirm in the definition.
struct pluralise {
    pluralise(std::size_t count, std::string const &label);

    friend std::ostream &operator<<(std::ostream &os, pluralise const &pluraliser);

    std::size_t m_count;
    std::string m_label;
};
}  // namespace Catch

// end catch_string_manip.h
#ifndef CATCH_CONFIG_DISABLE_MATCHERS
// start catch_capture_matchers.h

// start catch_matchers.h

#include <string>
#include <vector>

namespace Catch {
namespace Matchers {
namespace Impl {

template <typename ArgT>
struct MatchAllOf;
template <typename ArgT>
struct MatchAnyOf;
template <typename ArgT>
struct MatchNotOf;

// Type-independent part of every matcher: provides toString() on top of the
// describe() hook that concrete matchers implement. Copy-constructible but
// not assignable; the destructor is protected.
class MatcherUntypedBase {
public:
    MatcherUntypedBase() = default;
    MatcherUntypedBase(MatcherUntypedBase const &) = default;
    MatcherUntypedBase &operator=(MatcherUntypedBase const &) = delete;
    std::string toString() const;

protected:
    virtual ~MatcherUntypedBase();
    // Human-readable description of what the matcher checks.
    virtual std::string describe() const = 0;
    // mutable so that the const toString() can fill it in.
    // NOTE(review): presumably caches the result of describe().
    mutable std::string m_cachedToString;
};

#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wnon-virtual-dtor"
#endif

// Typed half of the matcher interface: the single predicate that decides
// whether `arg` matches. It deliberately has no virtual destructor; the
// surrounding pragmas silence clang's -Wnon-virtual-dtor warning for it.
template <typename ObjectT>
struct MatcherMethod {
    virtual bool match(ObjectT const &arg) const = 0;
};

#if defined(__OBJC__)
// Hack to fix Catch GH issue #1661. Could use `id` for generic Object support.
// Use of const for Object pointers is very uncommon, and under ARC it causes
// some kind of signature mismatch that breaks compilation, so this
// specialization takes the NSString pointer by value instead of by const
// reference.
template <>
struct MatcherMethod<NSString *> {
    virtual bool match(NSString *arg) const = 0;
};
#endif

#ifdef __clang__
#pragma clang diagnostic pop
#endif

// Base class for all typed matchers. Combines the untyped description
// interface with MatcherMethod<T>::match() and declares the composition
// operators (&&, ||, !); their definitions follow the MatchAllOf / MatchAnyOf /
// MatchNotOf templates further down.
template <typename T>
struct MatcherBase : MatcherUntypedBase, MatcherMethod<T> {
    MatchAllOf<T> operator&&(MatcherBase const &other) const;
    MatchAnyOf<T> operator||(MatcherBase const &other) const;
    MatchNotOf<T> operator!() const;
};

// Conjunction of matchers: match() succeeds only if every stored matcher
// succeeds. Matchers are held as non-owning pointers, so each combined
// matcher must outlive this object.
template <typename ArgT>
struct MatchAllOf : MatcherBase<ArgT> {
    bool match(ArgT const &arg) const override {
        for (auto it = m_matchers.begin(); it != m_matchers.end(); ++it) {
            if (!(*it)->match(arg)) {
                return false;
            }
        }
        return true;
    }

    // Produces "( a and b and ... )" from the individual descriptions.
    std::string describe() const override {
        std::string text;
        text.reserve(4 + m_matchers.size() * 32);
        text += "( ";
        for (std::size_t i = 0; i < m_matchers.size(); ++i) {
            if (i != 0) {
                text += " and ";
            }
            text += m_matchers[i]->toString();
        }
        text += " )";
        return text;
    }

    // Returns a copy of this conjunction extended with `other`; the receiver
    // itself is left unchanged.
    MatchAllOf<ArgT> operator&&(MatcherBase<ArgT> const &other) {
        MatchAllOf<ArgT> extended(*this);
        extended.m_matchers.push_back(&other);
        return extended;
    }

    std::vector<MatcherBase<ArgT> const *> m_matchers;
};
// Disjunction of matchers: match() succeeds as soon as any stored matcher
// succeeds. Matchers are held as non-owning pointers, so each combined
// matcher must outlive this object.
template <typename ArgT>
struct MatchAnyOf : MatcherBase<ArgT> {
    bool match(ArgT const &arg) const override {
        for (auto it = m_matchers.begin(); it != m_matchers.end(); ++it) {
            if ((*it)->match(arg)) {
                return true;
            }
        }
        return false;
    }

    // Produces "( a or b or ... )" from the individual descriptions.
    std::string describe() const override {
        std::string text;
        text.reserve(4 + m_matchers.size() * 32);
        text += "( ";
        for (std::size_t i = 0; i < m_matchers.size(); ++i) {
            if (i != 0) {
                text += " or ";
            }
            text += m_matchers[i]->toString();
        }
        text += " )";
        return text;
    }

    // Returns a copy of this disjunction extended with `other`; the receiver
    // itself is left unchanged.
    MatchAnyOf<ArgT> operator||(MatcherBase<ArgT> const &other) {
        MatchAnyOf<ArgT> extended(*this);
        extended.m_matchers.push_back(&other);
        return extended;
    }

    std::vector<MatcherBase<ArgT> const *> m_matchers;
};

// Negation of a single matcher. Only a reference to the wrapped matcher is
// stored, so that matcher must outlive this object.
template <typename ArgT>
struct MatchNotOf : MatcherBase<ArgT> {
    MatchNotOf(MatcherBase<ArgT> const &underlyingMatcher)
            : m_underlyingMatcher(underlyingMatcher) {}

    bool match(ArgT const &arg) const override {
        const bool underlyingResult = m_underlyingMatcher.match(arg);
        return !underlyingResult;
    }

    // Prefixes the wrapped matcher's description with "not ".
    std::string describe() const override {
        std::string text("not ");
        text += m_underlyingMatcher.toString();
        return text;
    }

    MatcherBase<ArgT> const &m_underlyingMatcher;
};

// Builds a two-element conjunction holding pointers to *this and `other`
// (in that order). Both operands must outlive the returned matcher.
template <typename T>
MatchAllOf<T> MatcherBase<T>::operator&&(MatcherBase const &other) const {
    MatchAllOf<T> combined;
    combined.m_matchers.push_back(this);
    combined.m_matchers.push_back(&other);
    return combined;
}
// Builds a two-element disjunction holding pointers to *this and `other`
// (in that order). Both operands must outlive the returned matcher.
template <typename T>
MatchAnyOf<T> MatcherBase<T>::operator||(MatcherBase const &other) const {
    MatchAnyOf<T> combined;
    combined.m_matchers.push_back(this);
    combined.m_matchers.push_back(&other);
    return combined;
}
// Wraps *this in a negating matcher. The result refers to *this by
// reference, so the operand must outlive it.
template <typename T>
MatchNotOf<T> MatcherBase<T>::operator!() const {
    MatchNotOf<T> negated(*this);
    return negated;
}

}  // namespace Impl

}  // namespace Matchers

using namespace Matchers;
using Matchers::Impl::MatcherBase;

}  // namespace Catch

// end catch_matchers.h
// start catch_matchers_exception.hpp

namespace Catch {
namespace Matchers {
namespace Exception {

// Matcher over std::exception that is configured with an expected message.
// match() and describe() are defined out of line; presumably match() compares
// ex.what() against m_message (definition not visible here).
class ExceptionMessageMatcher : public MatcherBase<std::exception> {
    std::string m_message;

public:
    // Stores a copy of `message`.
    ExceptionMessageMatcher(std::string const &message) : m_message(message) {}

    bool match(std::exception const &ex) const override;

    std::string describe() const override;
};

}  // namespace Exception

Exception::ExceptionMessageMatcher Message(std::string const &message);

}  // namespace Matchers
}  // namespace Catch

// end catch_matchers_exception.hpp
// start catch_matchers_floating.h

namespace Catch {
namespace Matchers {

namespace Floating {

enum class FloatingPointKind : uint8_t;

// Matcher over double configured with a target and a margin. Presumably
// accepts values whose absolute distance from the target is within the margin
// (match() is defined out of line).
struct WithinAbsMatcher : MatcherBase<double> {
    WithinAbsMatcher(double target, double margin);
    bool match(double const &matchee) const override;
    std::string describe() const override;

private:
    double m_target;
    double m_margin;
};

// Matcher over double configured with a target, a ULP count and the
// floating-point kind the comparison should be performed in. The comparison
// itself is defined out of line.
struct WithinUlpsMatcher : MatcherBase<double> {
    WithinUlpsMatcher(double target, uint64_t ulps, FloatingPointKind baseType);
    bool match(double const &matchee) const override;
    std::string describe() const override;

private:
    double m_target;
    uint64_t m_ulps;
    // Presumably distinguishes float targets from double targets — confirm
    // against the FloatingPointKind definition.
    FloatingPointKind m_type;
};

// Given IEEE-754 format for floats and doubles, we can assume
// that float -> double promotion is lossless. Given this, we can
// assume that if we do the standard relative comparison of
// |lhs - rhs| <= epsilon * max(fabs(lhs), fabs(rhs)), then we get
// the same result if we do this for floats, as if we do this for
// doubles that were promoted from floats.
// Relative-tolerance matcher over double, configured with a target and an
// epsilon. Always operates on double; float inputs reach it after promotion.
struct WithinRelMatcher : MatcherBase<double> {
    WithinRelMatcher(double target, double epsilon);
    bool match(double const &matchee) const override;
    std::string describe() const override;

private:
    double m_target;
    double m_epsilon;
};

}  // namespace Floating

// The following functions create the actual matcher objects.
// This allows the types to be inferred
Floating::WithinUlpsMatcher WithinULP(double target, uint64_t maxUlpDiff);
Floating::WithinUlpsMatcher WithinULP(float target, uint64_t maxUlpDiff);
Floating::WithinAbsMatcher WithinAbs(double target, double margin);
Floating::WithinRelMatcher WithinRel(double target, double eps);
// defaults epsilon to 100*numeric_limits<double>::epsilon()
Floating::WithinRelMatcher WithinRel(double target);
Floating::WithinRelMatcher WithinRel(float target, float eps);
// defaults epsilon to 100*numeric_limits<float>::epsilon()
Floating::WithinRelMatcher WithinRel(float target);

}  // namespace Matchers
}  // namespace Catch

// end catch_matchers_floating.h
// start catch_matchers_generic.hpp

#include <functional>
#include <string>

namespace Catch {
namespace Matchers {
namespace Generic {

namespace Detail {
std::string finalizeDescription(const std::string &desc);
}

// Matcher that delegates the decision to a user-supplied predicate and
// reports a user-supplied description.
template <typename T>
class PredicateMatcher : public MatcherBase<T> {
    std::function<bool(T const &)> m_predicate;
    std::string m_description;

public:
    // elem:  callable invoked by match(); a copy is stored in the matcher.
    // descr: description, passed through Detail::finalizeDescription() and
    //        later returned verbatim by describe().
    //
    // `elem` arrives by const reference, so wrapping it in std::move() could
    // never select the move constructor; copy it explicitly instead of
    // implying a move that does not happen.
    PredicateMatcher(std::function<bool(T const &)> const &elem, std::string const &descr)
            : m_predicate(elem), m_description(Detail::finalizeDescription(descr)) {}

    // Returns whatever the stored predicate returns for `item`.
    bool match(T const &item) const override { return m_predicate(item); }

    std::string describe() const override { return m_description; }
};

}  // namespace Generic

// The following functions create the actual matcher objects.
// The user has to explicitly specify type to the function, because
// inferring std::function<bool(T const&)> is hard (but possible) and
// requires a lot of TMP.
// Factory for PredicateMatcher<T>. T must be given explicitly by the caller;
// the description defaults to an empty string.
template <typename T>
Generic::PredicateMatcher<T> Predicate(std::function<bool(T const &)> const &predicate,
                                       std::string const &description = "") {
    using Matcher = Generic::PredicateMatcher<T>;
    return Matcher(predicate, description);
}

}  // namespace Matchers
}  // namespace Catch

// end catch_matchers_generic.hpp
// start catch_matchers_string.h

#include <string>

namespace Catch {
namespace Matchers {

namespace StdString {

// A comparison string bundled with the case-sensitivity mode to apply to it.
// The member functions are defined out of line.
struct CasedString {
    CasedString(std::string const &str, CaseSensitive::Choice caseSensitivity);
    // Presumably normalises `str` according to m_caseSensitivity — confirm
    // against the definition.
    std::string adjustString(std::string const &str) const;
    std::string caseSensitivitySuffix() const;

    CaseSensitive::Choice m_caseSensitivity;
    std::string m_str;
};

// Shared base of the std::string matchers: stores the comparison string and
// the name of the operation, and provides describe(). Concrete matchers only
// add match().
struct StringMatcherBase : MatcherBase<std::string> {
    StringMatcherBase(std::string const &operation, CasedString const &comparator);
    std::string describe() const override;

    CasedString m_comparator;
    std::string m_operation;
};

// String matcher created by Equals(); match() is defined out of line.
struct EqualsMatcher : StringMatcherBase {
    EqualsMatcher(CasedString const &comparator);
    bool match(std::string const &source) const override;
};
// String matcher created by Contains(); match() is defined out of line.
struct ContainsMatcher : StringMatcherBase {
    ContainsMatcher(CasedString const &comparator);
    bool match(std::string const &source) const override;
};
// String matcher created by StartsWith(); match() is defined out of line.
struct StartsWithMatcher : StringMatcherBase {
    StartsWithMatcher(CasedString const &comparator);
    bool match(std::string const &source) const override;
};
// String matcher created by EndsWith(); match() is defined out of line.
struct EndsWithMatcher : StringMatcherBase {
    EndsWithMatcher(CasedString const &comparator);
    bool match(std::string const &source) const override;
};

// String matcher configured with a regular expression (kept as text) and a
// case-sensitivity mode. Unlike the other string matchers it derives directly
// from MatcherBase<std::string> and supplies its own describe().
struct RegexMatcher : MatcherBase<std::string> {
    RegexMatcher(std::string regex, CaseSensitive::Choice caseSensitivity);
    bool match(std::string const &matchee) const override;
    std::string describe() const override;

private:
    std::string m_regex;
    CaseSensitive::Choice m_caseSensitivity;
};

}  // namespace StdString

// The following functions create the actual matcher objects.
// This allows the types to be inferred

StdString::EqualsMatcher Equals(std::string const &str,
                                CaseSensitive::Choice caseSensitivity = CaseSensitive::Yes);
StdString::ContainsMatcher Contains(std::string const &str,
                                    CaseSensitive::Choice caseSensitivity = CaseSensitive::Yes);
StdString::EndsWithMatcher EndsWith(std::string const &str,
                                    CaseSensitive::Choice caseSensitivity = CaseSensitive::Yes);
StdString::StartsWithMatcher StartsWith(std::string const &str,
                                        CaseSensitive::Choice caseSensitivity = CaseSensitive::Yes);
StdString::RegexMatcher Matches(std::string const &regex,
                                CaseSensitive::Choice caseSensitivity = CaseSensitive::Yes);

}  // namespace Matchers
}  // namespace Catch

// end catch_matchers_string.h
// start catch_matchers_vector.h

#include <algorithm>

namespace Catch {
namespace Matchers {

namespace Vector {
// Matches a vector that contains at least one element equal (operator==) to
// the comparator. Only a reference to the comparator is stored, so it must
// outlive the matcher.
template <typename T, typename Alloc>
struct ContainsElementMatcher : MatcherBase<std::vector<T, Alloc>> {
    ContainsElementMatcher(T const &comparator) : m_comparator(comparator) {}

    bool match(std::vector<T, Alloc> const &v) const override {
        // std::find evaluates `element == m_comparator` for each element.
        return std::find(v.begin(), v.end(), m_comparator) != v.end();
    }

    std::string describe() const override {
        std::string text("Contains: ");
        text += ::Catch::Detail::stringify(m_comparator);
        return text;
    }

    T const &m_comparator;
};

// Matches a vector in which every element of the comparator vector can be
// found (operator==). A comparator longer than the candidate is rejected up
// front. Only a reference to the comparator is stored, so it must outlive the
// matcher.
template <typename T, typename AllocComp, typename AllocMatch>
struct ContainsMatcher : MatcherBase<std::vector<T, AllocMatch>> {
    ContainsMatcher(std::vector<T, AllocComp> const &comparator) : m_comparator(comparator) {}

    bool match(std::vector<T, AllocMatch> const &v) const override {
        // !TBD: see note in EqualsMatcher
        if (v.size() < m_comparator.size()) {
            return false;
        }
        for (auto const &wanted : m_comparator) {
            // std::find evaluates `element == wanted` for each element of v.
            if (std::find(v.begin(), v.end(), wanted) == v.end()) {
                return false;
            }
        }
        return true;
    }

    std::string describe() const override {
        std::string text("Contains: ");
        text += ::Catch::Detail::stringify(m_comparator);
        return text;
    }

    std::vector<T, AllocComp> const &m_comparator;
};

// Matches a vector with the same length as the comparator and pairwise equal
// elements. Only a reference to the comparator is stored, so it must outlive
// the matcher.
template <typename T, typename AllocComp, typename AllocMatch>
struct EqualsMatcher : MatcherBase<std::vector<T, AllocMatch>> {
    EqualsMatcher(std::vector<T, AllocComp> const &comparator) : m_comparator(comparator) {}

    bool match(std::vector<T, AllocMatch> const &v) const override {
        // !TBD: This currently works if all elements can be compared using !=
        // - a more general approach would be via a compare template that defaults
        // to using !=. but could be specialised for, e.g. std::vector<T, Alloc> etc
        // - then just call that directly
        const std::size_t count = v.size();
        if (m_comparator.size() != count) {
            return false;
        }
        for (std::size_t idx = 0; idx != count; ++idx) {
            if (m_comparator[idx] != v[idx]) {
                return false;
            }
        }
        return true;
    }

    std::string describe() const override {
        std::string text("Equals: ");
        text += ::Catch::Detail::stringify(m_comparator);
        return text;
    }

    std::vector<T, AllocComp> const &m_comparator;
};

// Matches a vector with the same length as the comparator whose elements
// compare approximately equal, element by element, via Catch's Approx.
// epsilon(), margin() and scale() forward to the embedded Approx and return
// *this for chaining. Only a reference to the comparator is stored, so it
// must outlive the matcher.
template <typename T, typename AllocComp, typename AllocMatch>
struct ApproxMatcher : MatcherBase<std::vector<T, AllocMatch>> {
    ApproxMatcher(std::vector<T, AllocComp> const &comparator) : m_comparator(comparator) {}

    bool match(std::vector<T, AllocMatch> const &v) const override {
        const std::size_t count = v.size();
        if (m_comparator.size() != count) {
            return false;
        }
        for (std::size_t idx = 0; idx != count; ++idx) {
            if (m_comparator[idx] != approx(v[idx])) {
                return false;
            }
        }
        return true;
    }

    std::string describe() const override {
        std::string text("is approx: ");
        text += ::Catch::Detail::stringify(m_comparator);
        return text;
    }

    template <typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    ApproxMatcher &epsilon(T const &newEpsilon) {
        approx.epsilon(newEpsilon);
        return *this;
    }

    template <typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    ApproxMatcher &margin(T const &newMargin) {
        approx.margin(newMargin);
        return *this;
    }

    template <typename = typename std::enable_if<std::is_constructible<double, T>::value>::type>
    ApproxMatcher &scale(T const &newScale) {
        approx.scale(newScale);
        return *this;
    }

    std::vector<T, AllocComp> const &m_comparator;
    // Mutable so the const match() can invoke it.
    mutable Catch::Detail::Approx approx = Catch::Detail::Approx::custom();
};

// Matches a vector that is a permutation of the target: same length and the
// same elements in any order. Only a reference to the target is stored, so it
// must outlive the matcher.
template <typename T, typename AllocComp, typename AllocMatch>
struct UnorderedEqualsMatcher : MatcherBase<std::vector<T, AllocMatch>> {
    UnorderedEqualsMatcher(std::vector<T, AllocComp> const &target) : m_target(target) {}

    bool match(std::vector<T, AllocMatch> const &vec) const override {
        // The size check must come first: the three-iterator is_permutation
        // overload assumes the second range is at least as long as the first.
        return m_target.size() == vec.size() &&
               std::is_permutation(m_target.begin(), m_target.end(), vec.begin());
    }

    std::string describe() const override {
        std::string text("UnorderedEquals: ");
        text += ::Catch::Detail::stringify(m_target);
        return text;
    }

private:
    std::vector<T, AllocComp> const &m_target;
};

}  // namespace Vector

// The following functions create the actual matcher objects.
// This allows the types to be inferred

// Factory for Vector::ContainsMatcher. The matcher keeps a reference to
// `comparator`, which must therefore outlive it.
template <typename T, typename AllocComp = std::allocator<T>, typename AllocMatch = AllocComp>
Vector::ContainsMatcher<T, AllocComp, AllocMatch> Contains(
        std::vector<T, AllocComp> const &comparator) {
    using Matcher = Vector::ContainsMatcher<T, AllocComp, AllocMatch>;
    return Matcher(comparator);
}

// Factory for Vector::ContainsElementMatcher. The matcher keeps a reference
// to `comparator`, which must therefore outlive it.
template <typename T, typename Alloc = std::allocator<T>>
Vector::ContainsElementMatcher<T, Alloc> VectorContains(T const &comparator) {
    using Matcher = Vector::ContainsElementMatcher<T, Alloc>;
    return Matcher(comparator);
}

// Factory for Vector::EqualsMatcher. The matcher keeps a reference to
// `comparator`, which must therefore outlive it.
template <typename T, typename AllocComp = std::allocator<T>, typename AllocMatch = AllocComp>
Vector::EqualsMatcher<T, AllocComp, AllocMatch> Equals(
        std::vector<T, AllocComp> const &comparator) {
    using Matcher = Vector::EqualsMatcher<T, AllocComp, AllocMatch>;
    return Matcher(comparator);
}

// Factory for Vector::ApproxMatcher. The matcher keeps a reference to
// `comparator`, which must therefore outlive it.
template <typename T, typename AllocComp = std::allocator<T>, typename AllocMatch = AllocComp>
Vector::ApproxMatcher<T, AllocComp, AllocMatch> Approx(
        std::vector<T, AllocComp> const &comparator) {
    using Matcher = Vector::ApproxMatcher<T, AllocComp, AllocMatch>;
    return Matcher(comparator);
}

// Factory for Vector::UnorderedEqualsMatcher. The matcher keeps a reference
// to `target`, which must therefore outlive it.
template <typename T, typename AllocComp = std::allocator<T>, typename AllocMatch = AllocComp>
Vector::UnorderedEqualsMatcher<T, AllocComp, AllocMatch> UnorderedEquals(
        std::vector<T, AllocComp> const &target) {
    using Matcher = Vector::UnorderedEqualsMatcher<T, AllocComp, AllocMatch>;
    return Matcher(target);
}

}  // namespace Matchers
}  // namespace Catch

// end catch_matchers_vector.h
namespace Catch {

template <typename ArgT, typename MatcherT>
class MatchExpr : public ITransientExpression {
    ArgT const &m_arg;
    MatcherT m_matcher;
    StringRef m_matcherString;

public:
    MatchExpr(ArgT const &arg, MatcherT const &matcher, StringRef const &matcherString)
            : ITransientExpression{true, matcher.match(arg)},
              m_arg(arg),
              m_matcher(matcher),
              m_matcherString(matcherString) {}

    void streamReconstructedExpression(std::ostream &os) const override {
        auto matcherAsString = m_matcher.toString();
        os << Catch::Detail::stringify(m_arg) << ' ';
        if (matcherAsString == Detail::unprintableString)
            os << m_matcherString;
        else
            os << matcherAsString;
    }
};

using StringMatcher = Matchers::Impl::MatcherBase<std::string>;

void handleExceptionMatchExpr(AssertionHandler &handler,
                              StringMatcher const &matcher,
                              StringRef const &matcherString);

// Deduces ArgT and MatcherT and builds the corresponding MatchExpr.
template <typename ArgT, typename MatcherT>
MatchExpr<ArgT, MatcherT> makeMatchExpr(ArgT const &arg,
                                        MatcherT const &matcher,
                                        StringRef const &matcherString) {
    using Expr = MatchExpr<ArgT, MatcherT>;
    return Expr(arg, matcher, matcherString);
}

}  // namespace Catch

///////////////////////////////////////////////////////////////////////////////
// Implementation of the *_THAT assertion macros.
// Creates an AssertionHandler labelled with the stringified "arg, matcher",
// evaluates the match expression inside INTERNAL_CATCH_TRY, and lets
// INTERNAL_CATCH_CATCH / INTERNAL_CATCH_REACT deal with the outcome.
// The do { ... } while (false) wrapper makes the expansion a single statement.
#define INTERNAL_CHECK_THAT(macroName, matcher, resultDisposition, arg)               \
    do {                                                                              \
        Catch::AssertionHandler catchAssertionHandler(                                \
                macroName##_catch_sr, CATCH_INTERNAL_LINEINFO,                        \
                CATCH_INTERNAL_STRINGIFY(arg) ", " CATCH_INTERNAL_STRINGIFY(matcher), \
                resultDisposition);                                                   \
        INTERNAL_CATCH_TRY {                                                          \
            catchAssertionHandler.handleExpr(                                         \
                    Catch::makeMatchExpr(arg, matcher, #matcher##_catch_sr));         \
        }                                                                             \
        INTERNAL_CATCH_CATCH(catchAssertionHandler)                                   \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                                   \
    } while (false)

///////////////////////////////////////////////////////////////////////////////
// Implementation of the *_THROWS_MATCHES assertion macros.
// When the handler allows throwing calls, evaluates __VA_ARGS__ and:
//   - reports handleUnexpectedExceptionNotThrown() if nothing was thrown;
//   - applies `matcher` to the exception if one of `exceptionType` was caught;
//   - reports handleUnexpectedInflightException() for any other exception.
// When throwing calls are not allowed, the expression is not evaluated and
// handleThrowingCallSkipped() is reported instead.
#define INTERNAL_CATCH_THROWS_MATCHES(macroName, exceptionType, resultDisposition, matcher, ...) \
    do {                                                                                         \
        Catch::AssertionHandler catchAssertionHandler(                                           \
                macroName##_catch_sr, CATCH_INTERNAL_LINEINFO,                                   \
                CATCH_INTERNAL_STRINGIFY(__VA_ARGS__) ", " CATCH_INTERNAL_STRINGIFY(             \
                        exceptionType) ", " CATCH_INTERNAL_STRINGIFY(matcher),                   \
                resultDisposition);                                                              \
        if (catchAssertionHandler.allowThrows())                                                 \
            try {                                                                                \
                static_cast<void>(__VA_ARGS__);                                                  \
                catchAssertionHandler.handleUnexpectedExceptionNotThrown();                      \
            } catch (exceptionType const &ex) {                                                  \
                catchAssertionHandler.handleExpr(                                                \
                        Catch::makeMatchExpr(ex, matcher, #matcher##_catch_sr));                 \
            } catch (...) {                                                                      \
                catchAssertionHandler.handleUnexpectedInflightException();                       \
            }                                                                                    \
        else                                                                                     \
            catchAssertionHandler.handleThrowingCallSkipped();                                   \
        INTERNAL_CATCH_REACT(catchAssertionHandler)                                              \
    } while (false)

// end catch_capture_matchers.h
#endif
// start catch_generators.hpp

// start catch_interfaces_generatortracker.h

#include <memory>

namespace Catch {

namespace Generators {
// Type-erased base of all generators: exposes only advancement, so a
// generator can be stored and stepped without knowing its value type.
class GeneratorUntypedBase {
public:
    GeneratorUntypedBase() = default;
    virtual ~GeneratorUntypedBase();
    // Attempts to move the generator to the next element
    //
    // Returns true iff the move succeeded (and a valid element
    // can be retrieved).
    virtual bool next() = 0;
};
using GeneratorBasePtr = std::unique_ptr<GeneratorUntypedBase>;

}  // namespace Generators

// Interface of the object that holds the generator belonging to one GENERATE
// site. generate() queries hasGenerator(), installs a generator via
// setGenerator() when there is none, and reads it back with getGenerator().
struct IGeneratorTracker {
    virtual ~IGeneratorTracker();
    virtual auto hasGenerator() const -> bool = 0;
    virtual auto getGenerator() const -> Generators::GeneratorBasePtr const & = 0;
    // Takes ownership of `generator` (passed as an rvalue unique_ptr).
    virtual void setGenerator(Generators::GeneratorBasePtr &&generator) = 0;
};

}  // namespace Catch

// end catch_interfaces_generatortracker.h
// start catch_enforce.h

#include <exception>

namespace Catch {
#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
// Exceptions-enabled implementation: throws a copy of `e`. The thrown object
// has the static type Ex, so callers should pass the most-derived type they
// want handlers to see.
template <typename Ex>
[[noreturn]] void throw_exception(Ex const &e) {
    throw e;
}
#else  // ^^ Exceptions are enabled //  Exceptions are disabled vv
[[noreturn]] void throw_exception(std::exception const &e);
#endif

[[noreturn]] void throw_logic_error(std::string const &msg);
[[noreturn]] void throw_domain_error(std::string const &msg);
[[noreturn]] void throw_runtime_error(std::string const &msg);

}  // namespace Catch

// Builds a std::string by streaming the arguments into a
// ReusableStringStream; arguments are chained with <<.
#define CATCH_MAKE_MSG(...) (Catch::ReusableStringStream() << __VA_ARGS__).str()

// Raises a logic error whose message is prefixed with the source location and
// "Internal Catch2 error: ".
#define CATCH_INTERNAL_ERROR(...) \
    Catch::throw_logic_error(     \
            CATCH_MAKE_MSG(CATCH_INTERNAL_LINEINFO << ": Internal Catch2 error: " << __VA_ARGS__))

// Raises a domain error with the streamed message.
#define CATCH_ERROR(...) Catch::throw_domain_error(CATCH_MAKE_MSG(__VA_ARGS__))

// Raises a runtime error with the streamed message.
#define CATCH_RUNTIME_ERROR(...) Catch::throw_runtime_error(CATCH_MAKE_MSG(__VA_ARGS__))

// Raises CATCH_ERROR with the streamed message when `condition` is false.
// Wrapped in do { ... } while (false) so it expands to a single statement.
#define CATCH_ENFORCE(condition, ...) \
    do {                              \
        if (!(condition))             \
            CATCH_ERROR(__VA_ARGS__); \
    } while (false)

// end catch_enforce.h
#include <cassert>
#include <exception>
#include <memory>
#include <utility>
#include <vector>

namespace Catch {

// Exception type used by generators (e.g. thrown by FilterGenerator when no
// value passes the filter). It stores only the pointer it is given and does
// not copy the text, so `msg` must stay valid for as long as the exception
// may be inspected — string literals are the safe choice.
class GeneratorException : public std::exception {
    const char *const m_msg = "";

public:
    GeneratorException(const char *msg) : m_msg(msg) {}

    const char *what() const noexcept override final;
};

namespace Generators {

// !TBD move this into its own location?
namespace pf {
// Stand-in for std::make_unique: perfect-forwards the arguments to T's
// constructor and returns the new object wrapped in a std::unique_ptr<T>.
template <typename T, typename... Args>
std::unique_ptr<T> make_unique(Args &&...args) {
    T *const raw = new T(std::forward<Args>(args)...);
    return std::unique_ptr<T>(raw);
}
}  // namespace pf

// Typed generator interface: adds access to the current element on top of
// the untyped next() inherited from GeneratorUntypedBase.
template <typename T>
struct IGenerator : GeneratorUntypedBase {
    virtual ~IGenerator() = default;

    // Returns the current element of the generator
    //
    // \Precondition The generator is either freshly constructed,
    // or the last call to `next()` returned true
    virtual T const &get() const = 0;
    // Element type; generate() reads it through `::type`.
    using type = T;
};

// Generator that yields exactly one value: the one moved in at construction.
template <typename T>
class SingleValueGenerator final : public IGenerator<T> {
    T m_value;

public:
    SingleValueGenerator(T &&value) : m_value(std::move(value)) {}

    T const &get() const override {
        return m_value;
    }

    // There is never a second element.
    bool next() override {
        return false;
    }
};

// Generator that yields a fixed list of values in the order given.
// get() indexes the stored vector without bounds checking, so the IGenerator
// precondition applies: call it only on a fresh generator or after next()
// returned true.
template <typename T>
class FixedValuesGenerator final : public IGenerator<T> {
    // The adjacent string literals are concatenated by the compiler; the
    // trailing space keeps "std::vector<bool>" and "specialization" apart in
    // the resulting diagnostic.
    static_assert(!std::is_same<T, bool>::value,
                  "FixedValuesGenerator does not support bools because of std::vector<bool> "
                  "specialization, use SingleValue Generator instead.");
    std::vector<T> m_values;
    size_t m_idx = 0;

public:
    FixedValuesGenerator(std::initializer_list<T> values) : m_values(values) {}

    T const &get() const override { return m_values[m_idx]; }

    // Advances to the next stored value; returns false once the list is
    // exhausted.
    bool next() override {
        ++m_idx;
        return m_idx < m_values.size();
    }
};

// Owning, value-like handle around a heap-allocated IGenerator<T>; forwards
// get() and next() to the wrapped generator.
template <typename T>
class GeneratorWrapper final {
    std::unique_ptr<IGenerator<T>> m_generator;

public:
    GeneratorWrapper(std::unique_ptr<IGenerator<T>> generator)
            : m_generator(std::move(generator)) {}

    T const &get() const {
        return m_generator->get();
    }

    bool next() {
        return m_generator->next();
    }
};

// Wraps a single value in a generator that yields just that value.
template <typename T>
GeneratorWrapper<T> value(T &&value) {
    auto single = pf::make_unique<SingleValueGenerator<T>>(std::forward<T>(value));
    return GeneratorWrapper<T>(std::move(single));
}
// Wraps a list of values in a generator that yields them in order.
template <typename T>
GeneratorWrapper<T> values(std::initializer_list<T> values) {
    auto fixed = pf::make_unique<FixedValuesGenerator<T>>(values);
    return GeneratorWrapper<T>(std::move(fixed));
}

// Concatenation of several generators: yields everything from the first,
// then everything from the second, and so on. Constructor arguments may be
// generators, values of type T, or values convertible to T.
template <typename T>
class Generators : public IGenerator<T> {
    std::vector<GeneratorWrapper<T>> m_generators;
    size_t m_current = 0;

    // Adopts an already-wrapped generator.
    void populate(GeneratorWrapper<T> &&generator) {
        m_generators.emplace_back(std::move(generator));
    }

    // Wraps a plain T in a single-value generator.
    void populate(T &&val) {
        m_generators.emplace_back(value(std::forward<T>(val)));
    }

    // Converts anything else to T first, then wraps it.
    template <typename U>
    void populate(U &&val) {
        populate(T(std::forward<U>(val)));
    }

    // Peels off the first argument and recurses on the remainder.
    template <typename U, typename... Gs>
    void populate(U &&valueOrGenerator, Gs &&...moreGenerators) {
        populate(std::forward<U>(valueOrGenerator));
        populate(std::forward<Gs>(moreGenerators)...);
    }

public:
    template <typename... Gs>
    Generators(Gs &&...moreGenerators) {
        m_generators.reserve(sizeof...(Gs));
        populate(std::forward<Gs>(moreGenerators)...);
    }

    T const &get() const override {
        return m_generators[m_current].get();
    }

    // Advances the active generator; when it is exhausted, moves on to the
    // next one. Returns false once every generator has been consumed.
    bool next() override {
        const auto total = m_generators.size();
        if (m_current >= total) {
            return false;
        }
        if (!m_generators[m_current].next()) {
            ++m_current;
        }
        return m_current < total;
    }
};

// Builds a generator of tuples from a brace-enclosed list of rows.
template <typename... Ts>
GeneratorWrapper<std::tuple<Ts...>> table(
        std::initializer_list<std::tuple<typename std::decay<Ts>::type...>> tuples) {
    using Row = std::tuple<Ts...>;
    return values<Row>(tuples);
}

// Tag type to signal that a generator sequence should convert arguments to a
// specific type
// Empty tag: passing as<T>{} as the first argument selects the makeGenerators
// overload that converts the following value to T.
template <typename T>
struct as {};

template <typename T, typename... Gs>
auto makeGenerators(GeneratorWrapper<T> &&generator, Gs &&...moreGenerators) -> Generators<T> {
    return Generators<T>(std::move(generator), std::forward<Gs>(moreGenerators)...);
}
template <typename T>
auto makeGenerators(GeneratorWrapper<T> &&generator) -> Generators<T> {
    return Generators<T>(std::move(generator));
}
// A plain value first: it is wrapped in a single-value generator and the call
// is forwarded to the generator-first overloads.
template <typename T, typename... Gs>
Generators<T> makeGenerators(T &&val, Gs &&...moreGenerators) {
    return makeGenerators(value(std::forward<T>(val)), std::forward<Gs>(moreGenerators)...);
}
template <typename T, typename U, typename... Gs>
auto makeGenerators(as<T>, U &&val, Gs &&...moreGenerators) -> Generators<T> {
    return makeGenerators(value(T(std::forward<U>(val))), std::forward<Gs>(moreGenerators)...);
}

auto acquireGeneratorTracker(StringRef generatorName, SourceLineInfo const &lineInfo)
        -> IGeneratorTracker &;

// Entry point behind the GENERATE* macros.
// Looks up the tracker for this generator site and, if it has no generator
// yet, installs one built from generatorExpression(). It then returns the
// current element of the tracker's generator.
//
// generatorName / lineInfo: identify the generator site for the tracker.
// generatorExpression:      callable returning the generator to install; it
//                           is invoked only when the tracker has none.
template <typename L>
// Note: The type after -> is weird, because VS2015 cannot parse
//       the expression used in the typedef inside, when it is in
//       return type. Yeah.
auto generate(StringRef generatorName, SourceLineInfo const &lineInfo, L const &generatorExpression)
        -> decltype(std::declval<decltype(generatorExpression())>().get()) {
    using UnderlyingType = typename decltype(generatorExpression())::type;

    IGeneratorTracker &tracker = acquireGeneratorTracker(generatorName, lineInfo);
    if (!tracker.hasGenerator()) {
        tracker.setGenerator(pf::make_unique<Generators<UnderlyingType>>(generatorExpression()));
    }

    // The tracker stores generators type-erased; cast back to the typed
    // interface to read the current element.
    auto const &generator =
            static_cast<IGenerator<UnderlyingType> const &>(*tracker.getGenerator());
    return generator.get();
}

}  // namespace Generators
}  // namespace Catch

// Yields the current value of a generator built from the arguments.
// The generator expression is wrapped in a capture-less lambda ([]), so it
// cannot refer to local variables of the enclosing scope.
#define GENERATE(...)                                                                            \
    Catch::Generators::generate(INTERNAL_CATCH_STRINGIZE(INTERNAL_CATCH_UNIQUE_NAME(generator)), \
                                CATCH_INTERNAL_LINEINFO, [] {                                    \
                                    using namespace Catch::Generators;                           \
                                    return makeGenerators(__VA_ARGS__);                          \
                                })  // NOLINT(google-build-using-namespace)
// Same as GENERATE, but the lambda captures by copy ([=]), so the generator
// expression may read copies of local variables from the enclosing scope.
#define GENERATE_COPY(...)                                                                       \
    Catch::Generators::generate(INTERNAL_CATCH_STRINGIZE(INTERNAL_CATCH_UNIQUE_NAME(generator)), \
                                CATCH_INTERNAL_LINEINFO, [=] {                                   \
                                    using namespace Catch::Generators;                           \
                                    return makeGenerators(__VA_ARGS__);                          \
                                })  // NOLINT(google-build-using-namespace)
// Same as GENERATE, but the lambda captures by reference ([&]), so the
// generator expression may refer to local variables of the enclosing scope.
#define GENERATE_REF(...)                                                                        \
    Catch::Generators::generate(INTERNAL_CATCH_STRINGIZE(INTERNAL_CATCH_UNIQUE_NAME(generator)), \
                                CATCH_INTERNAL_LINEINFO, [&] {                                   \
                                    using namespace Catch::Generators;                           \
                                    return makeGenerators(__VA_ARGS__);                          \
                                })  // NOLINT(google-build-using-namespace)

// end catch_generators.hpp
// start catch_generators_generic.hpp

namespace Catch {
namespace Generators {

// Yields at most `target` elements of the wrapped generator, and fewer if the
// wrapped generator runs out first.
template <typename T>
class TakeGenerator : public IGenerator<T> {
    GeneratorWrapper<T> m_generator;
    size_t m_returned = 0;
    size_t m_target;

public:
    TakeGenerator(size_t target, GeneratorWrapper<T> &&generator)
            : m_generator(std::move(generator)), m_target(target) {
        assert(target != 0 && "Empty generators are not allowed");
    }

    T const &get() const override {
        return m_generator.get();
    }

    bool next() override {
        // Quota reached: stop without touching the wrapped generator.
        if (++m_returned >= m_target) {
            return false;
        }
        if (m_generator.next()) {
            return true;
        }
        // The wrapped generator ran dry early; mark the quota as used up so
        // later calls stop at the check above.
        m_returned = m_target;
        return false;
    }
};

// Limits `generator` to at most `target` elements.
template <typename T>
GeneratorWrapper<T> take(size_t target, GeneratorWrapper<T> &&generator) {
    auto limited = pf::make_unique<TakeGenerator<T>>(target, std::move(generator));
    return GeneratorWrapper<T>(std::move(limited));
}

// Yields only those elements of the wrapped generator for which the predicate
// returns true. Construction fails with a GeneratorException when no element
// passes the predicate.
template <typename T, typename Predicate>
class FilterGenerator : public IGenerator<T> {
    GeneratorWrapper<T> m_generator;
    Predicate m_predicate;

public:
    template <typename P = Predicate>
    FilterGenerator(P &&pred, GeneratorWrapper<T> &&generator)
            : m_generator(std::move(generator)), m_predicate(std::forward<P>(pred)) {
        // The first element must already be valid, because get() may be
        // called before next().
        if (m_predicate(m_generator.get())) {
            return;
        }
        // It might happen that there are no values that pass the
        // filter. In that case we throw an exception.
        if (!next()) {
            Catch::throw_exception(
                    GeneratorException("No valid value found in filtered generator"));
        }
    }

    T const &get() const override {
        return m_generator.get();
    }

    // Advances to the next element that satisfies the predicate; returns
    // false when the wrapped generator is exhausted first.
    bool next() override {
        if (!m_generator.next()) {
            return false;
        }
        while (!m_predicate(m_generator.get())) {
            if (!m_generator.next()) {
                return false;
            }
        }
        return true;
    }
};

// Factory for FilterGenerator: keeps only the values of `generator` that
// satisfy `pred`.
template <typename T, typename Predicate>
GeneratorWrapper<T> filter(Predicate &&pred, GeneratorWrapper<T> &&generator) {
    using Filtered = FilterGenerator<T, Predicate>;
    // Upcast to the interface pointer before handing it to the wrapper.
    std::unique_ptr<IGenerator<T>> filtered =
            pf::make_unique<Filtered>(std::forward<Predicate>(pred), std::move(generator));
    return GeneratorWrapper<T>(std::move(filtered));
}

// Generator adapter that replays the full sequence of the wrapped generator
// `repeats` times. The first pass reads the wrapped generator and records
// every value; later passes are served from that record.
template <typename T>
class RepeatGenerator : public IGenerator<T> {
    static_assert(!std::is_same<T, bool>::value,
                  "RepeatGenerator currently does not support bools "
                  "because of std::vector<bool> specialization");
    GeneratorWrapper<T> m_generator;
    // Values seen during the first pass, in order.
    std::vector<T> m_returned;
    size_t m_target_repeats;
    size_t m_current_repeat = 0;
    size_t m_repeat_index = 0;

public:
    // `repeats` is the total number of passes and must be at least 1
    // (checked with assert).
    RepeatGenerator(size_t repeats, GeneratorWrapper<T> &&generator)
            : m_generator(std::move(generator)), m_target_repeats(repeats) {
        assert(m_target_repeats > 0 && "Repeat generator must repeat at least once");
        // Record values when they become current (here and in next()) rather
        // than inside get(): get() may be called any number of times for the
        // same element, and recording there would duplicate entries in the
        // replayed sequence.
        m_returned.push_back(m_generator.get());
    }

    // Returns the current value. Idempotent: calling it repeatedly without
    // an intervening next() always yields the same element.
    T const &get() const override {
        if (m_current_repeat == 0) {
            return m_returned.back();
        }
        return m_returned[m_repeat_index];
    }

    // Moves to the next value; returns false once all passes are finished.
    bool next() override {
        // There are 2 basic cases:
        // 1) We are still reading the generator
        // 2) We are reading our own cache

        // In the first case, we need to poke the underlying generator.
        // If it happily moves, we record the new value, otherwise it is time
        // to start reading from our cache
        if (m_current_repeat == 0) {
            if (m_generator.next()) {
                m_returned.push_back(m_generator.get());
            } else {
                ++m_current_repeat;
            }
            return m_current_repeat < m_target_repeats;
        }

        // In the second case, we need to move indices forward and check that we
        // haven't run up against the end
        ++m_repeat_index;
        if (m_repeat_index == m_returned.size()) {
            m_repeat_index = 0;
            ++m_current_repeat;
        }
        return m_current_repeat < m_target_repeats;
    }
};

// Factory for RepeatGenerator: replays the values of `generator` for a total
// of `repeats` passes.
template <typename T>
GeneratorWrapper<T> repeat(size_t repeats, GeneratorWrapper<T> &&generator) {
    auto repeated = pf::make_unique<RepeatGenerator<T>>(repeats, std::move(generator));
    return GeneratorWrapper<T>(std::move(repeated));
}

// Generator adapter that applies a function to every value of a wrapped
// generator of U, exposing the results as values of type T.
template <typename T, typename U, typename Func>
class MapGenerator : public IGenerator<T> {
    // TBD: provide static assert for mapping function, for friendly error message
    GeneratorWrapper<U> m_generator;
    Func m_function;
    // get() hands out a reference, so the mapped value needs stable storage
    T m_cache;

public:
    // Takes ownership of `generator` and maps its initial value right away.
    // Member order matters here: m_cache is computed from the two members
    // declared before it.
    template <typename F2 = Func>
    MapGenerator(F2 &&function, GeneratorWrapper<U> &&generator)
            : m_generator(std::move(generator)),
              m_function(std::forward<F2>(function)),
              m_cache(m_function(m_generator.get())) {}

    // Result of mapping the wrapped generator's current value.
    T const &get() const override { return m_cache; }

    // Advances the wrapped generator and refreshes the mapped value. When the
    // wrapped generator is exhausted the previous value is left untouched.
    bool next() override {
        if (!m_generator.next()) {
            return false;
        }
        m_cache = m_function(m_generator.get());
        return true;
    }
};

// Factory for MapGenerator where the result type T defaults to
// FunctionReturnType<Func, U>.
template <typename Func, typename U, typename T = FunctionReturnType<Func, U>>
GeneratorWrapper<T> map(Func &&function, GeneratorWrapper<U> &&generator) {
    using Mapper = MapGenerator<T, U, Func>;
    auto mapped = pf::make_unique<Mapper>(std::forward<Func>(function), std::move(generator));
    return GeneratorWrapper<T>(std::move(mapped));
}

// Factory for MapGenerator where the caller names the result type T
// explicitly (T is the first template parameter).
template <typename T, typename U, typename Func>
GeneratorWrapper<T> map(Func &&function, GeneratorWrapper<U> &&generator) {
    using Mapper = MapGenerator<T, U, Func>;
    auto mapped = pf::make_unique<Mapper>(std::forward<Func>(function), std::move(generator));
    return GeneratorWrapper<T>(std::move(mapped));
}

// Generator adapter that groups the values of a wrapped generator into
// std::vector chunks of a fixed size.
template <typename T>
class ChunkGenerator final : public IGenerator<std::vector<T>> {
    std::vector<T> m_chunk;
    size_t m_chunk_size;
    GeneratorWrapper<T> m_generator;

public:
    // Builds the first chunk eagerly. Throws GeneratorException (through
    // Catch::throw_exception) if the wrapped generator cannot supply `size`
    // values. A size of 0 leaves the chunk empty and never touches the
    // wrapped generator.
    ChunkGenerator(size_t size, GeneratorWrapper<T> generator)
            : m_chunk_size(size), m_generator(std::move(generator)) {
        m_chunk.reserve(m_chunk_size);
        if (m_chunk_size != 0) {
            // The wrapped generator already sits on its first value, so only
            // the remaining size-1 elements require a call to next().
            m_chunk.push_back(m_generator.get());
            for (size_t i = 1; i < m_chunk_size; ++i) {
                if (!m_generator.next()) {
                    Catch::throw_exception(
                            GeneratorException("Not enough values to initialize the first chunk"));
                }
                m_chunk.push_back(m_generator.get());
            }
        }
    }

    // The current chunk.
    std::vector<T> const &get() const override { return m_chunk; }

    // Assembles the next chunk. Returns false if the wrapped generator runs
    // out before a complete chunk is collected; the partially filled chunk is
    // then left in place. With a chunk size of 0 this always returns true.
    bool next() override {
        m_chunk.clear();
        for (size_t idx = 0; idx < m_chunk_size; ++idx) {
            if (!m_generator.next()) {
                return false;
            }
            m_chunk.push_back(m_generator.get());
        }
        return true;
    }
};

// Factory for ChunkGenerator: groups the values of `generator` into vectors
// holding `size` elements each.
template <typename T>
GeneratorWrapper<std::vector<T>> chunk(size_t size, GeneratorWrapper<T> &&generator) {
    auto chunked = pf::make_unique<ChunkGenerator<T>>(size, std::move(generator));
    return GeneratorWrapper<std::vector<T>>(std::move(chunked));
}

}  // namespace Generators
}  // namespace Catch

// end catch_generators_generic.hpp
// start catch_generators_specific.hpp

// start catch_context.h

#include <memory>

namespace Catch {

// Forward declarations of the types the context interfaces below refer to
// only by pointer or reference.
struct IResultCapture;
struct IRunner;
struct IConfig;
struct IMutableContext;

// Shared-ownership handle to an immutable configuration.
using IConfigPtr = std::shared_ptr<IConfig const>;

// Getter-only interface of the Catch context: gives access to the result
// capture, the runner and the configuration.
struct IContext {
    virtual ~IContext();

    // The first two accessors return raw pointers and the third a reference
    // to a shared_ptr. NOTE(review): whether any of these may be null is not
    // visible from this declaration -- check the implementation.
    virtual IResultCapture *getResultCapture() = 0;
    virtual IRunner *getRunner() = 0;
    virtual IConfigPtr const &getConfig() const = 0;
};

// Extends IContext with the matching setters. It also owns the static
// pointer to the current context instance, which is only reachable through
// the friend functions getCurrentMutableContext() and cleanUpContext().
struct IMutableContext : IContext {
    virtual ~IMutableContext();
    virtual void setResultCapture(IResultCapture *resultCapture) = 0;
    virtual void setRunner(IRunner *runner) = 0;
    virtual void setConfig(IConfigPtr const &config) = 0;

private:
    // Instance handed out by getCurrentMutableContext(), which calls
    // createContext() when this pointer is still null.
    static IMutableContext *currentContext;
    friend IMutableContext &getCurrentMutableContext();
    friend void cleanUpContext();
    static void createContext();
};

// Returns the current context, asking IMutableContext::createContext() to
// set it up first if the static pointer is still null.
inline IMutableContext &getCurrentMutableContext() {
    const bool needs_creation = (IMutableContext::currentContext == nullptr);
    if (needs_creation) {
        IMutableContext::createContext();
    }
    // NOLINTNEXTLINE(clang-analyzer-core.uninitialized.UndefReturn)
    return *IMutableContext::currentContext;
}

// Same object as getCurrentMutableContext(), seen through the getter-only
// IContext interface.
inline IContext &getCurrentContext() {
    IMutableContext &current = getCurrentMutableContext();
    return current;
}

// Declared as a friend of IMutableContext, so it has access to the private
// static context pointer. NOTE(review): presumably destroys the current
// context -- the definition is not in this part of the file.
void cleanUpContext();

// Accessor for a SimplePcg32 random number generator; the random value
// generators bind a reference to its result.
class SimplePcg32;
SimplePcg32 &rng();
}  // namespace Catch

// end catch_context.h
// start catch_interfaces_config.h

// start catch_option.hpp

namespace Catch {

// An optional type
// Minimal optional value: holds either nothing or one T, constructed in
// place inside an internal, suitably aligned buffer (no heap allocation).
template <typename T>
class Option {
public:
    // Empty option.
    Option() : nullableValue(nullptr) {}
    // Option holding a copy of `_value`.
    Option(T const &_value) : nullableValue(new (storage) T(_value)) {}
    // Copies the held value of `_other`, if it has one.
    Option(Option const &_other) : nullableValue(_other ? new (storage) T(*_other) : nullptr) {}

    ~Option() { reset(); }

    // Replaces the contents with a copy of `_other`'s contents (or empties
    // this option when `_other` is empty). Self-assignment is a no-op.
    Option &operator=(Option const &_other) {
        if (&_other != this) {
            reset();
            if (_other)
                nullableValue = new (storage) T(*_other);
        }
        return *this;
    }
    // Replaces the contents with a copy of `_value`.
    Option &operator=(T const &_value) {
        // `_value` may be the very object stored in this option (as in
        // `opt = *opt`). Destroying it first and then copying from it would
        // read a dead object, so that case is treated as a no-op.
        if (&_value != nullableValue) {
            reset();
            nullableValue = new (storage) T(_value);
        }
        return *this;
    }

    // Destroys the held value, if any, leaving the option empty.
    void reset() {
        if (nullableValue)
            nullableValue->~T();
        nullableValue = nullptr;
    }

    // Unchecked access: dereferencing an empty option dereferences a null
    // pointer.
    T &operator*() { return *nullableValue; }
    T const &operator*() const { return *nullableValue; }
    T *operator->() { return nullableValue; }
    const T *operator->() const { return nullableValue; }

    // A copy of the held value, or of `defaultValue` when empty.
    T valueOr(T const &defaultValue) const { return nullableValue ? *nullableValue : defaultValue; }

    bool some() const { return nullableValue != nullptr; }
    bool none() const { return nullableValue == nullptr; }

    bool operator!() const { return nullableValue == nullptr; }
    explicit operator bool() const { return some(); }

private:
    // Points into `storage` while a value is held, null otherwise.
    T *nullableValue;
    alignas(alignof(T)) char storage[sizeof(T)];
};

}  // end namespace Catch

// end catch_option.hpp
#include <chrono>
#include <iosfwd>
#include <memory>
#include <string>
#include <vector>

namespace Catch {

// Output verbosity levels, in increasing order starting at 0.
enum class Verbosity { Quiet = 0, Normal, High };

// Warning categories. The non-zero values are distinct bits (0x01, 0x02),
// so they can be combined with bitwise OR.
struct WarnAbout {
    enum What { Nothing = 0x00, NoAssertions = 0x01, NoTests = 0x02 };
};

// Three-way choice for showing durations: defer to the reporter, or force
// them on or off.
struct ShowDurations {
    enum OrNot { DefaultForReporter, Always, Never };
};
// Order in which tests are run.
struct RunTests {
    enum InWhatOrder { InDeclarationOrder, InLexicographicalOrder, InRandomOrder };
};
// Colour choice: automatic, forced on, or forced off.
struct UseColour {
    enum YesOrNo { Auto, Yes, No };
};
// Points at which to wait for a keypress. BeforeStart and BeforeExit are
// distinct bits and BeforeStartAndExit is their bitwise OR; Never takes the
// implicit value 0.
struct WaitForKeypress {
    enum When {
        Never,
        BeforeStart = 1,
        BeforeExit = 2,
        BeforeStartAndExit = BeforeStart | BeforeExit
    };
};

class TestSpec;

// Abstract, non-copyable, read-only view of the run configuration. Every
// member is a const pure-virtual getter. The meaning of each setting is
// defined by the implementing class, not by this interface.
struct IConfig : NonCopyable {
    virtual ~IConfig();

    // General run settings.
    virtual bool allowThrows() const = 0;
    virtual std::ostream &stream() const = 0;
    virtual std::string name() const = 0;
    virtual bool includeSuccessfulResults() const = 0;
    virtual bool shouldDebugBreak() const = 0;
    virtual bool warnAboutMissingAssertions() const = 0;
    virtual bool warnAboutNoTests() const = 0;
    virtual int abortAfter() const = 0;
    virtual bool showInvisibles() const = 0;
    virtual ShowDurations::OrNot showDurations() const = 0;
    virtual double minDuration() const = 0;
    virtual TestSpec const &testSpec() const = 0;
    virtual bool hasTestFilters() const = 0;
    virtual std::vector<std::string> const &getTestsOrTags() const = 0;
    virtual RunTests::InWhatOrder runOrder() const = 0;
    virtual unsigned int rngSeed() const = 0;
    virtual UseColour::YesOrNo useColour() const = 0;
    virtual std::vector<std::string> const &getSectionsToRun() const = 0;
    virtual Verbosity verbosity() const = 0;

    // Benchmarking settings.
    virtual bool benchmarkNoAnalysis() const = 0;
    virtual int benchmarkSamples() const = 0;
    virtual double benchmarkConfidenceInterval() const = 0;
    virtual unsigned int benchmarkResamples() const = 0;
    virtual std::chrono::milliseconds benchmarkWarmupTime() const = 0;
};

using IConfigPtr = std::shared_ptr<IConfig const>;
}  // namespace Catch

// end catch_interfaces_config.h
// start catch_random_number_generator.h

#include <cstdint>

namespace Catch {

// This is a simple implementation of a C++11 Uniform Random Number
// Generator. It does not provide all operators, because Catch2
// does not use them, but it should behave as expected inside stdlib's
// distributions.
// The implementation is based on the PCG family (http://pcg-random.org)
// 32-bit random number generator with 64 bits of internal state. It exposes
// result_type, min(), max() and operator(), which is how the standard
// <random> distributions in this file consume it.
class SimplePcg32 {
    using state_type = std::uint64_t;

public:
    using result_type = std::uint32_t;
    // Output range is the full range of result_type: 0 up to the all-ones
    // value. NOTE(review): the names are parenthesised presumably to avoid
    // expansion of function-like min/max macros -- confirm.
    static constexpr result_type(min)() { return 0; }
    static constexpr result_type(max)() { return static_cast<result_type>(-1); }

    // Provide some default initial state for the default constructor
    SimplePcg32() : SimplePcg32(0xed743cc4U) {}

    explicit SimplePcg32(result_type seed_);

    void seed(result_type seed_);
    void discard(uint64_t skip);

    // Produces the next random number.
    result_type operator()();

private:
    friend bool operator==(SimplePcg32 const &lhs, SimplePcg32 const &rhs);
    friend bool operator!=(SimplePcg32 const &lhs, SimplePcg32 const &rhs);

    // In theory we also need operator<< and operator>>
    // In practice we do not use them, so we will skip them for now

    std::uint64_t m_state;
    // This part of the state determines which "stream" of the numbers
    // is chosen -- we take it as a constant for Catch2, so we only
    // need to deal with seeding the main state.
    // Picked by reading 8 bytes from `/dev/random` :-)
    static const std::uint64_t s_inc = (0x13ed0cc53f939476ULL << 1ULL) | 1ULL;
};

}  // end namespace Catch

// end catch_random_number_generator.h
#include <random>

namespace Catch {
namespace Generators {

// Endless generator of random floating point numbers, drawn from a
// std::uniform_real_distribution over (a, b) using the rng() engine.
template <typename Float>
class RandomFloatingGenerator final : public IGenerator<Float> {
    Catch::SimplePcg32 &m_rng;
    std::uniform_real_distribution<Float> m_dist;
    Float m_current_number;

public:
    // Draws the first number immediately so that get() is valid before the
    // first call to next(). The members are initialised in declaration
    // order, so the engine and the distribution are ready at that point.
    RandomFloatingGenerator(Float a, Float b)
            : m_rng(rng()), m_dist(a, b), m_current_number(m_dist(m_rng)) {}

    // The most recently drawn number.
    Float const &get() const override { return m_current_number; }

    // Draws a fresh number. This generator never runs out, so the result is
    // always true.
    bool next() override {
        const Float drawn = m_dist(m_rng);
        m_current_number = drawn;
        return true;
    }
};

// Endless generator of random integers, drawn from a
// std::uniform_int_distribution over (a, b) using the rng() engine.
template <typename Integer>
class RandomIntegerGenerator final : public IGenerator<Integer> {
    Catch::SimplePcg32 &m_rng;
    std::uniform_int_distribution<Integer> m_dist;
    Integer m_current_number;

public:
    // Draws the first number immediately so that get() is valid before the
    // first call to next(). The members are initialised in declaration
    // order, so the engine and the distribution are ready at that point.
    RandomIntegerGenerator(Integer a, Integer b)
            : m_rng(rng()), m_dist(a, b), m_current_number(m_dist(m_rng)) {}

    // The most recently drawn number.
    Integer const &get() const override { return m_current_number; }

    // Draws a fresh number. This generator never runs out, so the result is
    // always true.
    bool next() override {
        const Integer drawn = m_dist(m_rng);
        m_current_number = drawn;
        return true;
    }
};

// TODO: Ideally this would be also constrained against the various char types,
//       but I don't expect users to run into that in practice.
// Integral overload (bool excluded): random values produced by a
// RandomIntegerGenerator constructed from `a` and `b`.
template <typename T>
typename std::enable_if<std::is_integral<T>::value && !std::is_same<T, bool>::value,
                        GeneratorWrapper<T>>::type
random(T a, T b) {
    auto source = pf::make_unique<RandomIntegerGenerator<T>>(a, b);
    return GeneratorWrapper<T>(std::move(source));
}

// Floating point overload: random values produced by a
// RandomFloatingGenerator constructed from `a` and `b`.
template <typename T>
typename std::enable_if<std::is_floating_point<T>::value, GeneratorWrapper<T>>::type random(T a,
                                                                                            T b) {
    auto source = pf::make_unique<RandomFloatingGenerator<T>>(a, b);
    return GeneratorWrapper<T>(std::move(source));
}

// Generator over the half-open range [start, end), visited in increments of
// `step`. The step may be negative, in which case the range counts down.
template <typename T>
class RangeGenerator final : public IGenerator<T> {
    T m_current;
    T m_end;
    T m_step;
    // Direction of travel, derived from the sign of the step.
    bool m_positive;

public:
    // Preconditions (enforced with assert only): start != end, step != 0,
    // and the step must point from start towards end.
    RangeGenerator(T const &start, T const &end, T const &step)
            : m_current(start), m_end(end), m_step(step), m_positive(m_step > T(0)) {
        assert(m_current != m_end && "Range start and end cannot be equal");
        assert(m_step != T(0) && "Step size cannot be zero");
        assert(((m_positive && m_current <= m_end) || (!m_positive && m_current >= m_end)) &&
               "Step moves away from end");
    }

    // Uses a step of +1 when start < end, and -1 otherwise.
    RangeGenerator(T const &start, T const &end)
            : RangeGenerator(start, end, (start < end) ? T(1) : T(-1)) {}

    T const &get() const override { return m_current; }

    // Applies the step, then reports whether the new value is still short of
    // the (exclusive) end in the direction of travel.
    bool next() override {
        m_current += m_step;
        if (m_positive) {
            return m_current < m_end;
        }
        return m_current > m_end;
    }
};

// Factory for a RangeGenerator with an explicit step. Accepts any arithmetic
// type except bool.
template <typename T>
GeneratorWrapper<T> range(T const &start, T const &end, T const &step) {
    static_assert(std::is_arithmetic<T>::value && !std::is_same<T, bool>::value,
                  "Type must be numeric");
    auto stepped = pf::make_unique<RangeGenerator<T>>(start, end, step);
    return GeneratorWrapper<T>(std::move(stepped));
}

// Factory for a RangeGenerator with the default step chosen by the
// two-argument RangeGenerator constructor. Integral types only, bool
// excluded.
template <typename T>
GeneratorWrapper<T> range(T const &start, T const &end) {
    static_assert(std::is_integral<T>::value && !std::is_same<T, bool>::value,
                  "Type must be an integer");
    auto counted = pf::make_unique<RangeGenerator<T>>(start, end);
    return GeneratorWrapper<T>(std::move(counted));
}

// Generator that yields, in order, the elements copied out of an iterator
// range at construction time.
template <typename T>
class IteratorGenerator final : public IGenerator<T> {
    static_assert(!std::is_same<T, bool>::value,
                  "IteratorGenerator currently does not support bools "
                  "because of std::vector<bool> specialization");

    // Private copy of the source range.
    std::vector<T> m_elems;
    // Index of the element returned by get().
    size_t m_current = 0;

public:
    // Copies [first, last) into the generator. Throws GeneratorException
    // (through Catch::throw_exception) if the range is empty, so that get()
    // always has an element to return initially.
    template <typename InputIterator, typename InputSentinel>
    IteratorGenerator(InputIterator first, InputSentinel last) : m_elems(first, last) {
        if (m_elems.empty()) {
            Catch::throw_exception(
                    GeneratorException("IteratorGenerator received no valid values"));
        }
    }

    T const &get() const override { return m_elems[m_current]; }

    // Steps to the next element; returns false once the index has moved past
    // the last one.
    bool next() override {
        ++m_current;
        return m_current != m_elems.size();
    }
};

// Factory for an IteratorGenerator over the iterator range [from, to). The
// element type defaults to the iterator's value_type.
template <typename InputIterator,
          typename InputSentinel,
          typename ResultType = typename std::iterator_traits<InputIterator>::value_type>
GeneratorWrapper<ResultType> from_range(InputIterator from, InputSentinel to) {
    auto elements = pf::make_unique<IteratorGenerator<ResultType>>(from, to);
    return GeneratorWrapper<ResultType>(std::move(elements));
}

// Factory for an IteratorGenerator over all elements of a container. The
// element type defaults to the container's value_type.
template <typename Container, typename ResultType = typename Container::value_type>
GeneratorWrapper<ResultType> from_range(Container const &cnt) {
    auto elements = pf::make_unique<IteratorGenerator<ResultType>>(cnt.begin(), cnt.end());
    return GeneratorWrapper<ResultType>(std::move(elements));
}

}  // namespace Generators
}  // namespace Catch

// end catch_generators_specific.hpp

// These files are included here so the single_include script doesn't put them
// in the conditionally compiled sections
// start catch_test_case_info.h

#include <memory>
#include <string>
#include <vector>

#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wpadded"
#endif

namespace Catch {

struct ITestInvoker;

// Descriptive data about one test case: names, description, tags, source
// location and a set of property flags.
struct TestCaseInfo {
    // Bit flags (each value is a distinct power of two, starting at 1 << 1),
    // so several properties can be stored together in `properties`.
    enum SpecialProperties {
        None = 0,
        IsHidden = 1 << 1,
        ShouldFail = 1 << 2,
        MayFail = 1 << 3,
        Throws = 1 << 4,
        NonPortable = 1 << 5,
        Benchmark = 1 << 6
    };

    TestCaseInfo(std::string const &_name,
                 std::string const &_className,
                 std::string const &_description,
                 std::vector<std::string> const &_tags,
                 SourceLineInfo const &_lineInfo);

    // Free function with access to this struct; takes the tag list by value.
    friend void setTags(TestCaseInfo &testCaseInfo, std::vector<std::string> tags);

    // Queries; NOTE(review): presumably derived from `properties` -- the
    // definitions are not in this part of the file.
    bool isHidden() const;
    bool throws() const;
    bool okToFail() const;
    bool expectedToFail() const;

    std::string tagsAsString() const;

    std::string name;
    std::string className;
    std::string description;
    std::vector<std::string> tags;
    // NOTE(review): presumably the lower-cased form of `tags` -- confirm.
    std::vector<std::string> lcaseTags;
    SourceLineInfo lineInfo;
    SpecialProperties properties;
};

// A TestCaseInfo combined with the invoker that runs the test. The invoker
// is held through a shared_ptr, so copies of a TestCase share it.
class TestCase : public TestCaseInfo {
public:
    // Receives the invoker as a raw pointer; it is stored in the shared_ptr
    // member `test`.
    TestCase(ITestInvoker *testCase, TestCaseInfo &&info);

    // Returns a new TestCase; this object is left unchanged (const member).
    TestCase withName(std::string const &_newName) const;

    void invoke() const;

    TestCaseInfo const &getTestCaseInfo() const;

    bool operator==(TestCase const &other) const;
    bool operator<(TestCase const &other) const;

private:
    std::shared_ptr<ITestInvoker> test;
};

// Builds a TestCase from an invoker, the owning class name, the name/tags
// pair and the source location (declaration only; defined elsewhere).
TestCase makeTestCase(ITestInvoker *testCase,
                      std::string const &className,
                      NameAndTags const &nameAndTags,
                      SourceLineInfo const &lineInfo);
}  // namespace Catch

#ifdef __clang__
#pragma clang diagnostic pop
#endif

// end catch_test_case_info.h
// start catch_interfaces_runner.h

namespace Catch {

// Minimal runner interface: the only query it offers is whether the run is
// aborting.
struct IRunner {
    virtual ~IRunner();
    virtual bool aborting() const = 0;
};
}  // namespace Catch

// end catch_interfaces_runner.h

#ifdef __OBJC__
// start catch_objc.hpp

#import <objc/runtime.h>

#include <string>

// NB. Any general catch headers included here must be included
// in catch.hpp first to make sure they are included by the single
// header for non obj-usage

///////////////////////////////////////////////////////////////////////////////
// This protocol is really only here for (self) documenting purposes, since
// all its methods are optional.
@protocol OcFixture

@optional

// Both hooks are optional. OcMethod::invoke attempts setUp before the test
// selector and tearDown after it, on the same freshly created instance.
- (void)setUp;
- (void)tearDown;

@end

namespace Catch {

// Test invoker for a single Objective-C test method: runs the selector on a
// fresh instance of its class, surrounded by the optional setUp/tearDown
// hooks.
class OcMethod : public ITestInvoker {
public:
    OcMethod(Class cls, SEL sel) : m_cls(cls), m_sel(sel) {}

    virtual void invoke() const {
        id fixture = [[m_cls alloc] init];

        // Hook, test, hook -- in this order, all on the same instance and all
        // through the same optional-selector helper.
        SEL const steps[] = {@selector(setUp), m_sel, @selector(tearDown)};
        for (SEL step : steps) {
            performOptionalSelector(fixture, step);
        }

        arcSafeRelease(fixture);
    }

private:
    virtual ~OcMethod() {}

    Class m_cls;
    SEL m_sel;
};

namespace Detail {

// Looks up the class method named "Catch_<annotationName>_<testCaseName>" on
// `cls` and returns the string it yields, or "" if the lookup gives nothing.
inline std::string getAnnotation(Class cls,
                                 std::string const &annotationName,
                                 std::string const &testCaseName) {
    NSString *selectorName = [[NSString alloc]
            initWithFormat:@"Catch_%s_%s", annotationName.c_str(), testCaseName.c_str()];
    SEL annotationSelector = NSSelectorFromString(selectorName);
    arcSafeRelease(selectorName);

    id annotation = performOptionalSelector(cls, annotationSelector);
    if (!annotation) {
        return "";
    }
    return [(NSString *)annotation UTF8String];
}
}  // namespace Detail

// Scans every class known to the Objective-C runtime for methods whose name
// starts with "Catch_TestCase_" and registers each one as a test case, using
// the matching Name/Description annotation methods for its metadata.
// Returns the number of test methods registered.
inline std::size_t registerTestMethods() {
    std::size_t noTestMethods = 0;
    int noClasses = objc_getClassList(nullptr, 0);
    if (noClasses <= 0) {
        // Nothing to scan; also avoids a zero or negative allocation size.
        return noTestMethods;
    }

    Class *classes = (CATCH_UNSAFE_UNRETAINED Class *)malloc(sizeof(Class) * noClasses);
    if (!classes) {
        return noTestMethods;
    }
    objc_getClassList(classes, noClasses);

    for (int c = 0; c < noClasses; c++) {
        Class cls = classes[c];
        {
            u_int count;
            Method *methods = class_copyMethodList(cls, &count);
            for (u_int m = 0; m < count; m++) {
                SEL selector = method_getName(methods[m]);
                std::string methodName = sel_getName(selector);
                if (startsWith(methodName, "Catch_TestCase_")) {
                    // 15 == strlen("Catch_TestCase_"): keep only the suffix.
                    std::string testCaseName = methodName.substr(15);
                    std::string name = Detail::getAnnotation(cls, "Name", testCaseName);
                    std::string desc = Detail::getAnnotation(cls, "Description", testCaseName);
                    const char *className = class_getName(cls);

                    getMutableRegistryHub().registerTest(makeTestCase(
                            new OcMethod(cls, selector), className,
                            NameAndTags(name.c_str(), desc.c_str()), SourceLineInfo("", 0)));
                    noTestMethods++;
                }
            }
            free(methods);
        }
    }
    // The class list buffer was allocated here, so it is released here too.
    free(classes);
    return noTestMethods;
}

#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)

namespace Matchers {
namespace Impl {
namespace NSStringMatchers {

// Common base of the NSString matchers: owns a copy of the string to
// compare against.
struct StringHolder : MatcherBase<NSString *> {
    StringHolder(NSString *substr) : m_substr([substr copy]) {}
    StringHolder(StringHolder const &other) : m_substr([other.m_substr copy]) {}
    // Balances the -copy made by the constructors. This has to be the
    // destructor: written as a default constructor it would never run for
    // the existing matchers, so the copy would never be released.
    ~StringHolder() { arcSafeRelease(m_substr); }

    // Placeholder; every concrete matcher overrides this.
    bool match(NSString *str) const override { return false; }

    NSString *CATCH_ARC_STRONG m_substr;
};

// Matches strings that are equal to the held string.
struct Equals : StringHolder {
    Equals(NSString *substr) : StringHolder(substr) {}

    bool match(NSString *str) const override {
        // A nil subject is only considered when the held string is nil too.
        if (str == nil && m_substr != nil) {
            return false;
        }
        return [str isEqualToString:m_substr];
    }

    std::string describe() const override {
        std::string description = "equals string: ";
        description += Catch::Detail::stringify(m_substr);
        return description;
    }
};

// Matches strings in which the held string occurs somewhere.
struct Contains : StringHolder {
    Contains(NSString *substr) : StringHolder(substr) {}

    bool match(NSString *str) const override {
        // A nil subject is only considered when the held string is nil too.
        if (str == nil && m_substr != nil) {
            return false;
        }
        NSRange found = [str rangeOfString:m_substr];
        return found.location != NSNotFound;
    }

    std::string describe() const override {
        std::string description = "contains string: ";
        description += Catch::Detail::stringify(m_substr);
        return description;
    }
};

// Matches strings whose first occurrence of the held string is at index 0.
struct StartsWith : StringHolder {
    StartsWith(NSString *substr) : StringHolder(substr) {}

    bool match(NSString *str) const override {
        // A nil subject is only considered when the held string is nil too.
        if (str == nil && m_substr != nil) {
            return false;
        }
        NSRange found = [str rangeOfString:m_substr];
        return found.location == 0;
    }

    std::string describe() const override {
        std::string description = "starts with: ";
        description += Catch::Detail::stringify(m_substr);
        return description;
    }
};
// Matches strings that end with the held string.
struct EndsWith : StringHolder {
    EndsWith(NSString *substr) : StringHolder(substr) {}

    bool match(NSString *str) const override {
        // A nil subject is only considered when the held string is nil too.
        if (str == nil && m_substr != nil) {
            return false;
        }
        // Search from the back: the suffix is the LAST occurrence, so looking
        // at the first one would reject e.g. "abab" ending with "ab".
        NSRange lastMatch = [str rangeOfString:m_substr options:NSBackwardsSearch];
        // Comparing the end of the match with the length avoids the unsigned
        // subtraction `[str length] - [m_substr length]`, which wraps around
        // when the held string is longer than the subject.
        return lastMatch.location != NSNotFound &&
               lastMatch.location + lastMatch.length == [str length];
    }

    std::string describe() const override {
        return "ends with: " + Catch::Detail::stringify(m_substr);
    }
};

}  // namespace NSStringMatchers
}  // namespace Impl

// Factory functions for the NSString matchers. Each one builds the matcher
// of the same name around `substr`.
inline Impl::NSStringMatchers::Equals Equals(NSString *substr) {
    using Matcher = Impl::NSStringMatchers::Equals;
    return Matcher(substr);
}

inline Impl::NSStringMatchers::Contains Contains(NSString *substr) {
    using Matcher = Impl::NSStringMatchers::Contains;
    return Matcher(substr);
}

inline Impl::NSStringMatchers::StartsWith StartsWith(NSString *substr) {
    using Matcher = Impl::NSStringMatchers::StartsWith;
    return Matcher(substr);
}

inline Impl::NSStringMatchers::EndsWith EndsWith(NSString *substr) {
    using Matcher = Impl::NSStringMatchers::EndsWith;
    return Matcher(substr);
}

}  // namespace Matchers

using namespace Matchers;

#endif  // CATCH_CONFIG_DISABLE_MATCHERS

}  // namespace Catch

///////////////////////////////////////////////////////////////////////////////
// Pastes `uniqueSuffix` onto `root` to form a single identifier.
#define OC_MAKE_UNIQUE_NAME(root, uniqueSuffix) root##uniqueSuffix
// Emits two class methods returning the test name and description, followed
// by the signature of the instance method that holds the test body (the
// body is written by the user after the macro). The generated method names
// use the "Catch_Name_", "Catch_Description_" and "Catch_TestCase_" prefixes
// that registerTestMethods() and Detail::getAnnotation() look for.
#define OC_TEST_CASE2(name, desc, uniqueSuffix)                               \
    +(NSString *)OC_MAKE_UNIQUE_NAME(Catch_Name_test_, uniqueSuffix) {        \
        return @name;                                                         \
    }                                                                         \
    +(NSString *)OC_MAKE_UNIQUE_NAME(Catch_Description_test_, uniqueSuffix) { \
        return @desc;                                                         \
    }                                                                         \
    -(void)OC_MAKE_UNIQUE_NAME(Catch_TestCase_test_, uniqueSuffix)

// User-facing form: passes __LINE__ as the suffix argument.
#define OC_TEST_CASE(name, desc) OC_TEST_CASE2(name, desc, __LINE__)

// end catch_objc.hpp
#endif

// Benchmarking needs the externally-facing parts of reporters to work
#if defined(CATCH_CONFIG_EXTERNAL_INTERFACES) || defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// start catch_external_interfaces.h

// start catch_reporter_bases.hpp

// start catch_interfaces_reporter.h

// start catch_config.hpp

// start catch_test_spec_parser.h

#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wpadded"
#endif

// start catch_test_spec.h

#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wpadded"
#endif

// start catch_wildcard_pattern.h

namespace Catch {
// String pattern with an optional wildcard at the start and/or the end,
// matched with a configurable case sensitivity.
class WildcardPattern {
    // Where the wildcard sits. The two single positions are distinct bits
    // and WildcardAtBothEnds is their bitwise OR.
    enum WildcardPosition {
        NoWildcard = 0,
        WildcardAtStart = 1,
        WildcardAtEnd = 2,
        WildcardAtBothEnds = WildcardAtStart | WildcardAtEnd
    };

public:
    WildcardPattern(std::string const &pattern, CaseSensitive::Choice caseSensitivity);
    virtual ~WildcardPattern() = default;
    // Virtual, so derived pattern types can replace the matching logic.
    virtual bool matches(std::string const &str) const;

private:
    // NOTE(review): presumably applies the case-sensitivity setting to `str`
    // -- the definition is not in this part of the file.
    std::string normaliseString(std::string const &str) const;
    CaseSensitive::Choice m_caseSensitivity;
    WildcardPosition m_wildcard = NoWildcard;
    std::string m_pattern;
};
}  // namespace Catch

// end catch_wildcard_pattern.h
#include <memory>
#include <string>
#include <vector>

namespace Catch {

struct IConfig;

// A test specification: a list of filters, each made of patterns, that is
// matched against test cases. Filters are added by TestSpecParser (a friend).
class TestSpec {
    // Base class of all patterns: a named predicate over TestCaseInfo.
    class Pattern {
    public:
        explicit Pattern(std::string const &name);
        virtual ~Pattern();
        virtual bool matches(TestCaseInfo const &testCase) const = 0;
        std::string const &name() const;

    private:
        std::string const m_name;
    };
    using PatternPtr = std::shared_ptr<Pattern>;

    // Pattern backed by a WildcardPattern.
    class NamePattern : public Pattern {
    public:
        explicit NamePattern(std::string const &name, std::string const &filterString);
        bool matches(TestCaseInfo const &testCase) const override;

    private:
        WildcardPattern m_wildcardPattern;
    };

    // Pattern backed by a single tag string.
    class TagPattern : public Pattern {
    public:
        explicit TagPattern(std::string const &tag, std::string const &filterString);
        bool matches(TestCaseInfo const &testCase) const override;

    private:
        std::string m_tag;
    };

    // Pattern that wraps another pattern. NOTE(review): presumably negates
    // the wrapped pattern's result, as the name suggests -- confirm.
    class ExcludedPattern : public Pattern {
    public:
        explicit ExcludedPattern(PatternPtr const &underlyingPattern);
        bool matches(TestCaseInfo const &testCase) const override;

    private:
        PatternPtr m_underlyingPattern;
    };

    // A group of patterns evaluated together against one test case.
    struct Filter {
        std::vector<PatternPtr> m_patterns;

        bool matches(TestCaseInfo const &testCase) const;
        std::string name() const;
    };

public:
    // Result entry of matchesByFilter(): a name plus non-owning pointers to
    // test cases.
    struct FilterMatch {
        std::string name;
        std::vector<TestCase const *> tests;
    };
    using Matches = std::vector<FilterMatch>;
    using vectorStrings = std::vector<std::string>;

    bool hasFilters() const;
    bool matches(TestCaseInfo const &testCase) const;
    Matches matchesByFilter(std::vector<TestCase> const &testCases, IConfig const &config) const;
    const vectorStrings &getInvalidArgs() const;

private:
    std::vector<Filter> m_filters;
    std::vector<std::string> m_invalidArgs;
    friend class TestSpecParser;
};
}  // namespace Catch

#ifdef __clang__
#pragma clang diagnostic pop
#endif

// end catch_test_spec.h
// start catch_interfaces_tag_alias_registry.h

#include <string>

namespace Catch {

struct TagAlias;

// Interface for looking up tag aliases and expanding them inside a test
// spec string.
struct ITagAliasRegistry {
    virtual ~ITagAliasRegistry();
    // Nullptr if not present
    virtual TagAlias const *find(std::string const &alias) const = 0;
    // Returns the expanded spec as a new string; the argument is not modified.
    virtual std::string expandAliases(std::string const &unexpandedTestSpec) const = 0;

    // Static accessor for a registry instance.
    static ITagAliasRegistry const &get();
};

}  // end namespace Catch

// end catch_interfaces_tag_alias_registry.h
namespace Catch {

// Builds a TestSpec from test spec strings. The parser keeps a current mode
// plus position and buffer members as its state; strings are fed in through
// parse() and the result is collected with testSpec().
class TestSpecParser {
    // Parsing states.
    enum Mode { None, Name, QuotedName, Tag, EscapedName };
    Mode m_mode = None;
    // Mode stored by saveLastMode() / restored by revertBackToLastMode()
    // (judging by the names -- the definitions are not in this part of the
    // file).
    Mode lastMode = None;
    bool m_exclusion = false;
    std::size_t m_pos = 0;
    std::size_t m_realPatternPos = 0;
    std::string m_arg;
    // The two buffers below both receive every character passed to
    // addCharToPattern().
    std::string m_substring;
    std::string m_patternName;
    std::vector<std::size_t> m_escapeChars;
    TestSpec::Filter m_currentFilter;
    TestSpec m_testSpec;
    ITagAliasRegistry const *m_tagAliases = nullptr;

public:
    TestSpecParser(ITagAliasRegistry const &tagAliases);

    // Returns *this so that calls can be chained.
    TestSpecParser &parse(std::string const &arg);
    TestSpec testSpec();

private:
    bool visitChar(char c);
    void startNewMode(Mode mode);
    bool processNoneChar(char c);
    void processNameChar(char c);
    bool processOtherChar(char c);
    void endMode();
    void escape();
    bool isControlChar(char c) const;
    void saveLastMode();
    void revertBackToLastMode();
    void addFilter();
    bool separate();

    // Handles common preprocessing of the pattern for name/tag patterns
    std::string preprocessPattern();
    // Adds the current pattern as a test name
    void addNamePattern();
    // Adds the current pattern as a tag
    void addTagPattern();

    // Appends `c` to both pattern buffers and advances the real pattern
    // position by one.
    inline void addCharToPattern(char c) {
        m_substring += c;
        m_patternName += c;
        m_realPatternPos++;
    }
};
// Free function that turns a spec string into a TestSpec (declaration only;
// defined elsewhere).
TestSpec parseTestSpec(std::string const &arg);

}  // namespace Catch

#ifdef __clang__
#pragma clang diagnostic pop
#endif

// end catch_test_spec_parser.h
// Libstdc++ doesn't like incomplete classes for unique_ptr

#include <memory>
#include <string>
#include <vector>

#ifndef CATCH_CONFIG_CONSOLE_WIDTH
#define CATCH_CONFIG_CONSOLE_WIDTH 80
#endif

namespace Catch {

struct IStream;

// Plain aggregate of all configuration settings together with their default
// values. Config is constructed from one of these and stores it.
struct ConfigData {
    // Listing switches.
    bool listTests = false;
    bool listTags = false;
    bool listReporters = false;
    bool listTestNamesOnly = false;

    // General behaviour switches.
    bool showSuccessfulTests = false;
    bool shouldDebugBreak = false;
    bool noThrow = false;
    bool showHelp = false;
    bool showInvisibles = false;
    bool filenamesAsTags = false;
    bool libIdentify = false;

    // NOTE(review): -1 presumably means "never abort" -- confirm against the
    // code that reads abortAfter.
    int abortAfter = -1;
    unsigned int rngSeed = 0;

    // Benchmarking defaults. The warm-up time is stored as a raw
    // std::chrono::milliseconds tick count.
    bool benchmarkNoAnalysis = false;
    unsigned int benchmarkSamples = 100;
    double benchmarkConfidenceInterval = 0.95;
    unsigned int benchmarkResamples = 100000;
    std::chrono::milliseconds::rep benchmarkWarmupTime = 100;

    Verbosity verbosity = Verbosity::Normal;
    WarnAbout::What warnings = WarnAbout::Nothing;
    ShowDurations::OrNot showDurations = ShowDurations::DefaultForReporter;
    // NOTE(review): -1 presumably means "no minimum duration" -- confirm.
    double minDuration = -1;
    RunTests::InWhatOrder runOrder = RunTests::InDeclarationOrder;
    UseColour::YesOrNo useColour = UseColour::Auto;
    WaitForKeypress::When waitForKeypress = WaitForKeypress::Never;

    std::string outputFilename;
    std::string name;
    std::string processName;
    // The default reporter is "console" unless CATCH_CONFIG_DEFAULT_REPORTER
    // was defined beforehand. The macro is undefined again right after it
    // has been used for the initialiser below.
#ifndef CATCH_CONFIG_DEFAULT_REPORTER
#define CATCH_CONFIG_DEFAULT_REPORTER "console"
#endif
    std::string reporterName = CATCH_CONFIG_DEFAULT_REPORTER;
#undef CATCH_CONFIG_DEFAULT_REPORTER

    std::vector<std::string> testsOrTags;
    std::vector<std::string> sectionsToRun;
};

// Concrete IConfig implementation backed by a ConfigData value.
// Members marked `override` implement the IConfig interface; the remaining
// accessors are specific to this class. All member functions are only declared
// here; their definitions are elsewhere.
class Config : public IConfig {
public:
    Config() = default;
    // Builds the configuration from `data` (a copy is kept in m_data).
    Config(ConfigData const &data);
    virtual ~Config() = default;

    std::string const &getFilename() const;

    // Accessors for the listing flags.
    bool listTests() const;
    bool listTestNamesOnly() const;
    bool listTags() const;
    bool listReporters() const;

    std::string getProcessName() const;
    std::string const &getReporterName() const;

    std::vector<std::string> const &getTestsOrTags() const override;
    std::vector<std::string> const &getSectionsToRun() const override;

    TestSpec const &testSpec() const override;
    bool hasTestFilters() const override;

    bool showHelp() const;

    // IConfig interface
    bool allowThrows() const override;
    std::ostream &stream() const override;
    std::string name() const override;
    bool includeSuccessfulResults() const override;
    bool warnAboutMissingAssertions() const override;
    bool warnAboutNoTests() const override;
    ShowDurations::OrNot showDurations() const override;
    double minDuration() const override;
    RunTests::InWhatOrder runOrder() const override;
    unsigned int rngSeed() const override;
    UseColour::YesOrNo useColour() const override;
    bool shouldDebugBreak() const override;
    int abortAfter() const override;
    bool showInvisibles() const override;
    Verbosity verbosity() const override;
    bool benchmarkNoAnalysis() const override;
    // NOTE(review): returns int although ConfigData::benchmarkSamples is declared
    // unsigned int; the return type is fixed by the IConfig interface.
    int benchmarkSamples() const override;
    double benchmarkConfidenceInterval() const override;
    unsigned int benchmarkResamples() const override;
    std::chrono::milliseconds benchmarkWarmupTime() const override;

private:
    // Declared only; presumably creates the output stream held in m_stream --
    // confirm against the definition.
    IStream const *openStream();
    ConfigData m_data;

    // Owns the stream object. IStream is only forward-declared at this point.
    std::unique_ptr<IStream const> m_stream;
    TestSpec m_testSpec;
    bool m_hasTestFilters = false;
};

}  // end namespace Catch

// end catch_config.hpp
// start catch_assertionresult.h

#include <string>

namespace Catch {

// Data carried by an assertion result: its result type, an optional message
// and the (lazily evaluated) expression.
struct AssertionResultData {
    // No default construction: a result type and a lazy expression are required.
    AssertionResultData() = delete;

    AssertionResultData(ResultWas::OfType _resultType, LazyExpression const &_lazyExpression);

    std::string message;
    // `mutable` so that the const member reconstructExpression() below is able
    // to modify it; presumably used as a cache -- confirm against the definition.
    mutable std::string reconstructedExpression;
    LazyExpression lazyExpression;
    ResultWas::OfType resultType;

    // Returns the expression as a string (defined elsewhere).
    std::string reconstructExpression() const;
};

// Pairs the static information about an assertion (AssertionInfo) with the
// data produced when it was evaluated (AssertionResultData) and exposes query
// functions over both. All member functions are defined elsewhere.
class AssertionResult {
public:
    // Must always be built from an info/data pair.
    AssertionResult() = delete;
    AssertionResult(AssertionInfo const &info, AssertionResultData const &data);

    bool isOk() const;
    bool succeeded() const;
    ResultWas::OfType getResultType() const;
    bool hasExpression() const;
    bool hasMessage() const;
    std::string getExpression() const;
    std::string getExpressionInMacro() const;
    bool hasExpandedExpression() const;
    std::string getExpandedExpression() const;
    std::string getMessage() const;
    SourceLineInfo getSourceInfo() const;
    StringRef getTestMacroName() const;

    // The access specifier below is commented out, so these two members are
    // public.
    // protected:
    AssertionInfo m_info;
    AssertionResultData m_resultData;
};

}  // end namespace Catch

// end catch_assertionresult.h
#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// start catch_estimate.hpp

// Statistics estimates

namespace Catch {
namespace Benchmark {
// A statistical estimate: the point value, the lower and upper bounds around
// it, and the confidence interval those bounds belong to. The three values
// share one Duration type.
template <typename Duration>
struct Estimate {
    Duration point;
    Duration lower_bound;
    Duration upper_bound;
    double confidence_interval;

    // Conversion to an Estimate over a different duration type. Each of the
    // three values is converted implicitly to TargetDuration inside a braced
    // initialiser (so narrowing conversions are rejected); the confidence
    // interval is carried over unchanged.
    template <typename TargetDuration>
    operator Estimate<TargetDuration>() const {
        Estimate<TargetDuration> converted = {point, lower_bound, upper_bound,
                                              confidence_interval};
        return converted;
    }
};
}  // namespace Benchmark
}  // namespace Catch

// end catch_estimate.hpp
// start catch_outlier_classification.hpp

// Outlier information

namespace Catch {
namespace Benchmark {
// Counters describing how many samples were classified as outliers, split by
// direction (low/high) and severity (mild/severe). Every counter starts at 0.
struct OutlierClassification {
    int samples_seen = 0;
    // Below Q1 by more than 3 times the IQR.
    int low_severe = 0;
    // Below Q1 by 1.5 to 3 times the IQR.
    int low_mild = 0;
    // Above Q3 by 1.5 to 3 times the IQR.
    int high_mild = 0;
    // Above Q3 by more than 3 times the IQR.
    int high_severe = 0;

    // Number of outliers across all four categories (samples_seen is not
    // part of the sum).
    int total() const {
        int count = low_severe;
        count += low_mild;
        count += high_mild;
        count += high_severe;
        return count;
    }
};
}  // namespace Benchmark
}  // namespace Catch

// end catch_outlier_classification.hpp

#include <iterator>
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

#include <algorithm>
#include <iosfwd>
#include <map>
#include <memory>
#include <set>
#include <string>

namespace Catch {

// What a reporter receives on construction: the full run configuration and
// the output stream it should use.
struct ReporterConfig {
    // Takes only the configuration; how the stream is chosen in this case is
    // decided by the definition, which is not visible here.
    explicit ReporterConfig(IConfigPtr const &_fullConfig);

    // Takes the configuration together with an explicit output stream.
    ReporterConfig(IConfigPtr const &_fullConfig, std::ostream &_stream);

    std::ostream &stream() const;
    IConfigPtr fullConfig() const;

private:
    // Non-owning pointer to the stream handed out by stream().
    std::ostream *m_stream;
    IConfigPtr m_fullConfig;
};

// Preferences a reporter returns from IStreamingReporter::getPreferences().
// Both flags default to false.
struct ReporterPreferences {
    bool shouldRedirectStdOut = false;
    bool shouldReportAllAssertions = false;
};

// An Option<T> with an extra `used` flag. The flag is cleared whenever a new
// value is assigned or the option is reset; setting it is left to the code
// that owns the LazyStat.
template <typename T>
struct LazyStat : Option<T> {
    bool used = false;

    // Stores `_value` through the base-class assignment, then clears `used`.
    LazyStat &operator=(T const &_value) {
        this->Option<T>::operator=(_value);
        used = false;
        return *this;
    }

    // Resets the underlying option through the base class, then clears `used`.
    void reset() {
        this->Option<T>::reset();
        used = false;
    }
};

// Identifies a test run by name.
struct TestRunInfo {
    // Not `explicit`, so a std::string converts implicitly to a TestRunInfo.
    TestRunInfo(std::string const &_name);
    std::string name;
};
// Identifies a test group: its name, its index and the number of groups.
struct GroupInfo {
    GroupInfo(std::string const &_name, std::size_t _groupIndex, std::size_t _groupsCount);

    std::string name;
    std::size_t groupIndex;
    // NOTE(review): the member is spelled `groupsCounts` while the constructor
    // parameter is `_groupsCount`; presumably they carry the same value --
    // confirm against the constructor definition.
    std::size_t groupsCounts;
};

// Everything reported when an assertion ends: the result itself, the info
// messages that accompany it and the totals passed in at that point.
struct AssertionStats {
    AssertionStats(AssertionResult const &_assertionResult,
                   std::vector<MessageInfo> const &_infoMessages,
                   Totals const &_totals);

    // Copy- and move-constructible, but deliberately not assignable.
    AssertionStats(AssertionStats const &) = default;
    AssertionStats(AssertionStats &&) = default;
    AssertionStats &operator=(AssertionStats const &) = delete;
    AssertionStats &operator=(AssertionStats &&) = delete;
    // Declared here, defined elsewhere.
    virtual ~AssertionStats();

    AssertionResult assertionResult;
    std::vector<MessageInfo> infoMessages;
    Totals totals;
};

// Everything reported when a section ends: which section it was, its
// assertion counts, how long it took and whether assertions were missing.
struct SectionStats {
    SectionStats(SectionInfo const &_sectionInfo,
                 Counts const &_assertions,
                 double _durationInSeconds,
                 bool _missingAssertions);
    // Fully copyable and movable.
    SectionStats(SectionStats const &) = default;
    SectionStats(SectionStats &&) = default;
    SectionStats &operator=(SectionStats const &) = default;
    SectionStats &operator=(SectionStats &&) = default;
    // Declared here, defined elsewhere.
    virtual ~SectionStats();

    SectionInfo sectionInfo;
    Counts assertions;
    double durationInSeconds;
    bool missingAssertions;
};

// Everything reported when a test case ends: the test case info, its totals,
// the stdout/stderr text passed in with it and the aborting flag.
struct TestCaseStats {
    TestCaseStats(TestCaseInfo const &_testInfo,
                  Totals const &_totals,
                  std::string const &_stdOut,
                  std::string const &_stdErr,
                  bool _aborting);

    // Fully copyable and movable.
    TestCaseStats(TestCaseStats const &) = default;
    TestCaseStats(TestCaseStats &&) = default;
    TestCaseStats &operator=(TestCaseStats const &) = default;
    TestCaseStats &operator=(TestCaseStats &&) = default;
    // Declared here, defined elsewhere.
    virtual ~TestCaseStats();

    TestCaseInfo testInfo;
    Totals totals;
    std::string stdOut;
    std::string stdErr;
    bool aborting;
};

// Everything reported when a test group ends: the group info, its totals and
// the aborting flag.
struct TestGroupStats {
    TestGroupStats(GroupInfo const &_groupInfo, Totals const &_totals, bool _aborting);
    // Overload taking only the group info; the values given to `totals` and
    // `aborting` are set by the definition, which is not visible here.
    TestGroupStats(GroupInfo const &_groupInfo);

    // Fully copyable and movable.
    TestGroupStats(TestGroupStats const &) = default;
    TestGroupStats(TestGroupStats &&) = default;
    TestGroupStats &operator=(TestGroupStats const &) = default;
    TestGroupStats &operator=(TestGroupStats &&) = default;
    // Declared here, defined elsewhere.
    virtual ~TestGroupStats();

    GroupInfo groupInfo;
    Totals totals;
    bool aborting;
};

// Everything reported when a test run ends: the run info, its totals and the
// aborting flag.
struct TestRunStats {
    TestRunStats(TestRunInfo const &_runInfo, Totals const &_totals, bool _aborting);

    // Fully copyable and movable.
    TestRunStats(TestRunStats const &) = default;
    TestRunStats(TestRunStats &&) = default;
    TestRunStats &operator=(TestRunStats const &) = default;
    TestRunStats &operator=(TestRunStats &&) = default;
    // Declared here, defined elsewhere.
    virtual ~TestRunStats();

    TestRunInfo runInfo;
    Totals totals;
    bool aborting;
};

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// Description of a benchmark, passed to IStreamingReporter::benchmarkStarting
// and embedded in BenchmarkStats. Only compiled when
// CATCH_CONFIG_ENABLE_BENCHMARKING is defined.
// NOTE(review): the units of the double fields are not stated in this part of
// the file -- confirm before relying on them.
struct BenchmarkInfo {
    std::string name;
    double estimatedDuration;
    int iterations;
    int samples;
    unsigned int resamples;
    double clockResolution;
    double clockCost;
};

// Results of one benchmark: the collected samples, the mean and standard
// deviation estimates, and the outlier analysis, all using the same Duration
// type.
template <class Duration>
struct BenchmarkStats {
    BenchmarkInfo info;

    std::vector<Duration> samples;
    Benchmark::Estimate<Duration> mean;
    Benchmark::Estimate<Duration> standardDeviation;
    Benchmark::OutlierClassification outliers;
    double outlierVariance;

    // Conversion to stats over a different duration type. Each sample is
    // converted explicitly to TargetDuration; the two estimates go through
    // Estimate's own conversion operator; the other fields are copied as-is.
    template <typename TargetDuration>
    operator BenchmarkStats<TargetDuration>() const {
        std::vector<TargetDuration> convertedSamples;
        convertedSamples.reserve(samples.size());
        for (Duration sample : samples) {
            convertedSamples.push_back(TargetDuration(sample));
        }
        return {
                info,     std::move(convertedSamples), mean, standardDeviation,
                outliers, outlierVariance,
        };
    }
};
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// Interface implemented by every reporter and listener. The functions are
// event callbacks named after the point in the run they correspond to. Most
// are pure virtual; the ones with a body in this struct default to doing
// nothing.
struct IStreamingReporter {
    virtual ~IStreamingReporter() = default;

    // Implementing class must also provide the following static methods:
    // static std::string getDescription();
    // static std::set<Verbosity> getSupportedVerbosities()

    virtual ReporterPreferences getPreferences() const = 0;

    virtual void noMatchingTestCases(std::string const &spec) = 0;

    // Optional callback; ignored unless overridden.
    virtual void reportInvalidArguments(std::string const &) {}

    virtual void testRunStarting(TestRunInfo const &testRunInfo) = 0;
    virtual void testGroupStarting(GroupInfo const &groupInfo) = 0;

    virtual void testCaseStarting(TestCaseInfo const &testInfo) = 0;
    virtual void sectionStarting(SectionInfo const &sectionInfo) = 0;

    // Benchmark callbacks exist only when benchmarking support is compiled in;
    // all four are optional and do nothing unless overridden.
#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
    virtual void benchmarkPreparing(std::string const &) {}
    virtual void benchmarkStarting(BenchmarkInfo const &) {}
    virtual void benchmarkEnded(BenchmarkStats<> const &) {}
    virtual void benchmarkFailed(std::string const &) {}
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

    virtual void assertionStarting(AssertionInfo const &assertionInfo) = 0;

    // The return value indicates if the messages buffer should be cleared:
    virtual bool assertionEnded(AssertionStats const &assertionStats) = 0;

    virtual void sectionEnded(SectionStats const &sectionStats) = 0;
    virtual void testCaseEnded(TestCaseStats const &testCaseStats) = 0;
    virtual void testGroupEnded(TestGroupStats const &testGroupStats) = 0;
    virtual void testRunEnded(TestRunStats const &testRunStats) = 0;

    virtual void skipTest(TestCaseInfo const &testInfo) = 0;

    // Default empty implementation provided
    virtual void fatalErrorEncountered(StringRef name);

    // Not pure virtual: a default implementation is defined elsewhere.
    virtual bool isMulti() const;
};
// Reporters are handed around through this uniquely-owning pointer type.
using IStreamingReporterPtr = std::unique_ptr<IStreamingReporter>;

// Factory interface: creates a reporter from a ReporterConfig and provides a
// description string for it.
struct IReporterFactory {
    // Declared here, defined elsewhere.
    virtual ~IReporterFactory();
    virtual IStreamingReporterPtr create(ReporterConfig const &config) const = 0;
    virtual std::string getDescription() const = 0;
};
// Factories are shared, so they are handled through shared_ptr.
using IReporterFactoryPtr = std::shared_ptr<IReporterFactory>;

// Read-only view of the registered reporter factories and listener factories.
struct IReporterRegistry {
    // Reporter factories keyed by a string (the same kind of key create() takes).
    using FactoryMap = std::map<std::string, IReporterFactoryPtr>;
    // Listener factories are kept as a plain sequence, without names.
    using Listeners = std::vector<IReporterFactoryPtr>;

    // Declared here, defined elsewhere.
    virtual ~IReporterRegistry();
    // Creates the reporter called `name` for the given configuration.
    // NOTE(review): the behaviour for an unknown name is up to the
    // implementation and not visible here -- confirm.
    virtual IStreamingReporterPtr create(std::string const &name,
                                         IConfigPtr const &config) const = 0;
    virtual FactoryMap const &getFactories() const = 0;
    virtual Listeners const &getListeners() const = 0;
};

}  // end namespace Catch

// end catch_interfaces_reporter.h
#include <algorithm>
#include <cassert>
#include <cfloat>
#include <cstdio>
#include <cstring>
#include <memory>
#include <ostream>

namespace Catch {
// Called by CumulativeReporterBase::assertionEnded on an assertion result
// before a copy of that result is stored. Declared here, defined elsewhere.
void prepareExpandedExpression(AssertionResult &result);

// Returns double formatted as %.3f (format expected on output)
std::string getFormattedDuration(double duration);

//! Should the reporter show the given duration under the given configuration?
bool shouldShowDuration(IConfig const &config, double duration);

// Turns the filter strings in `container` into a single string; the exact
// output format is determined by the definition, which is not visible here.
std::string serializeFilters(std::vector<std::string> const &container);

// Convenience base for reporters that emit output while the run progresses.
// It remembers the current run, group and test case, keeps a stack of the
// sections that are currently open, and supplies do-nothing defaults for some
// callbacks. DerivedT is the concrete reporter (CRTP); its static
// getSupportedVerbosities() is consulted by the constructor.
template <typename DerivedT>
struct StreamingReporterBase : IStreamingReporter {
    // Captures the configuration and output stream from `_config`, then raises
    // a CATCH_ERROR when the configured verbosity is not one DerivedT supports.
    StreamingReporterBase(ReporterConfig const &_config)
            : m_config(_config.fullConfig()), stream(_config.stream()) {
        m_reporterPrefs.shouldRedirectStdOut = false;
        auto const supported = DerivedT::getSupportedVerbosities();
        if (supported.count(m_config->verbosity()) == 0) {
            CATCH_ERROR("Verbosity level not supported by this reporter");
        }
    }

    ReporterPreferences getPreferences() const override {
        return m_reporterPrefs;
    }

    // Default set of supported verbosities: Normal only. A derived reporter may
    // declare its own static function of the same name to support more.
    static std::set<Verbosity> getSupportedVerbosities() {
        return {Verbosity::Normal};
    }

    ~StreamingReporterBase() override = default;

    // Ignored by default.
    void noMatchingTestCases(std::string const &) override {}

    // Ignored by default.
    void reportInvalidArguments(std::string const &) override {}

    // The three "starting" callbacks below record what is currently running.
    void testRunStarting(TestRunInfo const &runInfo) override { currentTestRunInfo = runInfo; }

    void testGroupStarting(GroupInfo const &groupInfo) override {
        currentGroupInfo = groupInfo;
    }

    void testCaseStarting(TestCaseInfo const &testInfo) override { currentTestCaseInfo = testInfo; }

    // A section that starts is pushed onto the open-section stack ...
    void sectionStarting(SectionInfo const &sectionInfo) override {
        m_sectionStack.push_back(sectionInfo);
    }

    // ... and popped again when it ends.
    void sectionEnded(SectionStats const &) override { m_sectionStack.pop_back(); }

    // Each "ended" callback clears the matching piece of recorded state.
    void testCaseEnded(TestCaseStats const &) override { currentTestCaseInfo.reset(); }

    void testGroupEnded(TestGroupStats const &) override { currentGroupInfo.reset(); }

    // At the end of the run everything that was recorded is cleared.
    void testRunEnded(TestRunStats const &) override {
        currentTestCaseInfo.reset();
        currentGroupInfo.reset();
        currentTestRunInfo.reset();
    }

    void skipTest(TestCaseInfo const &) override {
        // Nothing is done here by default; a derived reporter may override
        // this if it wants to react to skipped tests.
    }

    IConfigPtr m_config;
    std::ostream &stream;

    LazyStat<TestRunInfo> currentTestRunInfo;
    LazyStat<GroupInfo> currentGroupInfo;
    LazyStat<TestCaseInfo> currentTestCaseInfo;

    std::vector<SectionInfo> m_sectionStack;
    ReporterPreferences m_reporterPrefs;
};

// Convenience base for reporters that need the complete results before they
// can write anything. Events are collected into a tree
// (run -> groups -> test cases -> sections -> assertions) and, once the run
// has ended, testRunEndedCumulative() is invoked so that the derived reporter
// can produce its output. DerivedT is the concrete reporter (CRTP); its static
// getSupportedVerbosities() is consulted by the constructor.
template <typename DerivedT>
struct CumulativeReporterBase : IStreamingReporter {
    // Generic tree node: a stats value of type T plus shared ownership of its
    // children.
    template <typename T, typename ChildNodeT>
    struct Node {
        using ChildNodes = std::vector<std::shared_ptr<ChildNodeT>>;

        explicit Node(T const &_value) : value(_value) {}
        virtual ~Node() = default;

        T value;
        ChildNodes children;
    };

    // Tree node for a section: its stats, nested sections, the assertions
    // recorded while it was the innermost open section, and captured output.
    struct SectionNode {
        using ChildSections = std::vector<std::shared_ptr<SectionNode>>;
        using Assertions = std::vector<AssertionStats>;

        explicit SectionNode(SectionStats const &_stats) : stats(_stats) {}
        virtual ~SectionNode() = default;

        // Two section nodes compare equal when their line info matches.
        bool operator==(SectionNode const &other) const {
            return stats.sectionInfo.lineInfo == other.stats.sectionInfo.lineInfo;
        }
        // Same comparison, taking the other node through a shared_ptr.
        bool operator==(std::shared_ptr<SectionNode> const &other) const {
            return this->operator==(*other);
        }

        SectionStats stats;
        ChildSections childSections;
        Assertions assertions;
        std::string stdOut;
        std::string stdErr;
    };

    // Predicate that matches a section node having the same name and line info
    // as a given SectionInfo. Only a reference to that SectionInfo is kept, so
    // it has to stay alive for as long as the predicate is in use.
    struct BySectionInfo {
        BySectionInfo(SectionInfo const &other) : m_other(other) {}
        BySectionInfo(BySectionInfo const &other) : m_other(other.m_other) {}
        bool operator()(std::shared_ptr<SectionNode> const &node) const {
            SectionInfo const &candidate = node->stats.sectionInfo;
            return (candidate.name == m_other.name) && (candidate.lineInfo == m_other.lineInfo);
        }
        void operator=(BySectionInfo const &) = delete;

    private:
        SectionInfo const &m_other;
    };

    using TestCaseNode = Node<TestCaseStats, SectionNode>;
    using TestGroupNode = Node<TestGroupStats, TestCaseNode>;
    using TestRunNode = Node<TestRunStats, TestGroupNode>;

    // Captures the configuration and output stream from `_config`, then raises
    // a CATCH_ERROR when the configured verbosity is not one DerivedT supports.
    CumulativeReporterBase(ReporterConfig const &_config)
            : m_config(_config.fullConfig()), stream(_config.stream()) {
        m_reporterPrefs.shouldRedirectStdOut = false;
        auto const supported = DerivedT::getSupportedVerbosities();
        if (supported.count(m_config->verbosity()) == 0) {
            CATCH_ERROR("Verbosity level not supported by this reporter");
        }
    }
    ~CumulativeReporterBase() override = default;

    ReporterPreferences getPreferences() const override {
        return m_reporterPrefs;
    }

    // Default set of supported verbosities: Normal only.
    static std::set<Verbosity> getSupportedVerbosities() {
        return {Verbosity::Normal};
    }

    // Nothing is recorded when a run, group or test case starts; their nodes
    // are created from the stats delivered by the matching "ended" callback.
    void testRunStarting(TestRunInfo const &) override {}
    void testGroupStarting(GroupInfo const &) override {}

    void testCaseStarting(TestCaseInfo const &) override {}

    // Finds or creates the node for the section being entered and makes it the
    // top of the open-section stack. With no section open this is the root
    // section of the test case; otherwise it is a child of the innermost open
    // section, reused when a child with the same name and line info exists.
    void sectionStarting(SectionInfo const &sectionInfo) override {
        // Placeholder stats; replaced with the real ones in sectionEnded().
        SectionStats incompleteStats(sectionInfo, Counts(), 0, false);
        std::shared_ptr<SectionNode> current;
        if (!m_sectionStack.empty()) {
            auto &siblings = m_sectionStack.back()->childSections;
            auto const match =
                    std::find_if(siblings.begin(), siblings.end(), BySectionInfo(sectionInfo));
            if (match != siblings.end()) {
                current = *match;
            } else {
                current = std::make_shared<SectionNode>(incompleteStats);
                siblings.push_back(current);
            }
        } else {
            if (!m_rootSection) {
                m_rootSection = std::make_shared<SectionNode>(incompleteStats);
            }
            current = m_rootSection;
        }
        m_sectionStack.push_back(current);
        m_deepestSection = std::move(current);
    }

    void assertionStarting(AssertionInfo const &) override {}

    // Stores a copy of the assertion in the innermost open section. Always
    // returns true.
    bool assertionEnded(AssertionStats const &assertionStats) override {
        assert(!m_sectionStack.empty());
        // The AssertionResult refers to a temporary DecomposedExpression that
        // getExpandedExpression() would use to build the expression string.
        // The copy stored below is likely to outlive that temporary, so the
        // expression has to be expanded (or discarded) right now; otherwise a
        // destroyed object could be called later on.
        prepareExpandedExpression(const_cast<AssertionResult &>(assertionStats.assertionResult));
        m_sectionStack.back()->assertions.push_back(assertionStats);
        return true;
    }

    // Replaces the placeholder stats of the innermost open section with the
    // final ones and closes the section.
    void sectionEnded(SectionStats const &sectionStats) override {
        assert(!m_sectionStack.empty());
        m_sectionStack.back()->stats = sectionStats;
        m_sectionStack.pop_back();
    }

    // Wraps the finished root section in a test case node, queues that node for
    // the current group, and attaches the captured stdout/stderr to the section
    // that was entered most recently.
    void testCaseEnded(TestCaseStats const &testCaseStats) override {
        auto testCase = std::make_shared<TestCaseNode>(testCaseStats);
        assert(m_sectionStack.empty());
        testCase->children.push_back(m_rootSection);
        m_testCases.push_back(testCase);
        m_rootSection.reset();

        assert(m_deepestSection);
        m_deepestSection->stdOut = testCaseStats.stdOut;
        m_deepestSection->stdErr = testCaseStats.stdErr;
    }

    // Moves the test cases collected so far under a new group node.
    void testGroupEnded(TestGroupStats const &testGroupStats) override {
        auto group = std::make_shared<TestGroupNode>(testGroupStats);
        group->children.swap(m_testCases);
        m_testGroups.push_back(group);
    }

    // Moves the groups collected so far under a new run node, then lets the
    // derived reporter produce its output.
    void testRunEnded(TestRunStats const &testRunStats) override {
        auto run = std::make_shared<TestRunNode>(testRunStats);
        run->children.swap(m_testGroups);
        m_testRuns.push_back(run);
        testRunEndedCumulative();
    }

    // Invoked at the end of testRunEnded(), after the run node has been added
    // to m_testRuns.
    virtual void testRunEndedCumulative() = 0;

    void skipTest(TestCaseInfo const &) override {}

    IConfigPtr m_config;
    std::ostream &stream;
    // m_assertions and m_sections are not touched by any function of this
    // class.
    std::vector<AssertionStats> m_assertions;
    std::vector<std::vector<std::shared_ptr<SectionNode>>> m_sections;
    // Test cases finished since the last testGroupEnded().
    std::vector<std::shared_ptr<TestCaseNode>> m_testCases;
    // Groups finished since the last testRunEnded().
    std::vector<std::shared_ptr<TestGroupNode>> m_testGroups;

    std::vector<std::shared_ptr<TestRunNode>> m_testRuns;

    // Root section of the test case in progress (empty between test cases).
    std::shared_ptr<SectionNode> m_rootSection;
    // The section passed to the most recent sectionStarting() call.
    std::shared_ptr<SectionNode> m_deepestSection;
    // Sections that are currently open, innermost last.
    std::vector<std::shared_ptr<SectionNode>> m_sectionStack;
    ReporterPreferences m_reporterPrefs;
};

template <char C>
char const *getLineOfChars() {
    static char line[CATCH_CONFIG_CONSOLE_WIDTH] = {0};
    if (!*line) {
        std::memset(line, C, CATCH_CONFIG_CONSOLE_WIDTH - 1);
        line[CATCH_CONFIG_CONSOLE_WIDTH - 1] = 0;
    }
    return line;
}

// Base class for event listeners. It builds on StreamingReporterBase and
// declares the two assertion callbacks that StreamingReporterBase leaves
// unimplemented, plus its own getSupportedVerbosities(). All members are
// defined elsewhere.
struct TestEventListenerBase : StreamingReporterBase<TestEventListenerBase> {
    TestEventListenerBase(ReporterConfig const &_config);

    // Hides StreamingReporterBase::getSupportedVerbosities(); the set returned
    // is determined by the definition, which is not visible here.
    static std::set<Verbosity> getSupportedVerbosities();

    void assertionStarting(AssertionInfo const &) override;
    bool assertionEnded(AssertionStats const &) override;
};

}  // end namespace Catch

// end catch_reporter_bases.hpp
// start catch_console_colour.h

namespace Catch {

// Console colour handling. The nested enum names the available colours; a
// Colour object can be used as a scoped guard, and the static use() changes
// the colour without creating an object. Member functions are defined
// elsewhere.
struct Colour {
    enum Code {
        None = 0,

        // Base colours, numbered consecutively after None.
        White,
        Red,
        Green,
        Blue,
        Cyan,
        Yellow,
        Grey,

        // Flag bit that is OR-ed with a base colour to form its bright variant.
        Bright = 0x10,

        BrightRed = Bright | Red,
        BrightGreen = Bright | Green,
        LightGrey = Bright | Grey,
        BrightWhite = Bright | White,
        BrightYellow = Bright | Yellow,

        // Aliases named after what the colour is used for rather than how it
        // looks.
        FileName = LightGrey,
        Warning = BrightYellow,
        ResultError = BrightRed,
        ResultSuccess = BrightGreen,
        ResultExpectedFailure = Warning,

        Error = BrightRed,
        Success = Green,

        OriginalExpression = Cyan,
        ReconstructedExpression = BrightYellow,

        SecondaryText = LightGrey,
        Headers = White
    };

    // Use constructed object for RAII guard
    Colour(Code _colourCode);
    // Movable; no copy operations are declared.
    Colour(Colour &&other) noexcept;
    Colour &operator=(Colour &&other) noexcept;
    ~Colour();

    // Use static method for one-shot changes
    static void use(Code _colourCode);

private:
    // Presumably marks an object whose guard role was transferred by a move --
    // confirm against the move operations' definitions.
    bool m_moved = false;
};

// Stream insertion overload for Colour objects. Declared here, defined
// elsewhere; what (if anything) is written to `os` is not visible here.
std::ostream &operator<<(std::ostream &os, Colour const &);

}  // end namespace Catch

// end catch_console_colour.h
// start catch_reporter_registrars.hpp

namespace Catch {

template <typename T>
class ReporterRegistrar {
    class ReporterFactory : public IReporterFactory {
        IStreamingReporterPtr create(ReporterConfig const &config) const override {
            return std::unique_ptr<T>(new T(config));
        }

        std::string getDescription() const override { return T::getDescription(); }
    };

public:
    explicit ReporterRegistrar(std::string const &name) {
        getMutableRegistryHub().registerReporter(name, std::make_shared<ReporterFactory>());
    }
};

template <typename T>
class ListenerRegistrar {
    class ListenerFactory : public IReporterFactory {
        IStreamingReporterPtr create(ReporterConfig const &config) const override {
            return std::unique_ptr<T>(new T(config));
        }
        std::string getDescription() const override { return std::string(); }
    };

public:
    ListenerRegistrar() {
        getMutableRegistryHub().registerListener(std::make_shared<ListenerFactory>());
    }
};
}  // namespace Catch

// Registration macros. When CATCH_CONFIG_DISABLE is defined both of them
// expand to nothing (see the #else branch).
#if !defined(CATCH_CONFIG_DISABLE)

// Defines, inside an unnamed namespace, a Catch::ReporterRegistrar object for
// `reporterType` constructed with `name`, wrapped in the warning-suppression
// macros. The object's identifier is formed by pasting `reporterType` onto a
// fixed prefix, so `reporterType` has to be a single identifier (no `::`
// qualification, no template arguments).
#define CATCH_REGISTER_REPORTER(name, reporterType)                                         \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                               \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                                \
    namespace {                                                                             \
    Catch::ReporterRegistrar<reporterType> catch_internal_RegistrarFor##reporterType(name); \
    }                                                                                       \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION

// Same idea for listeners: defines a default-constructed
// Catch::ListenerRegistrar object for `listenerType`. The single-identifier
// restriction applies here as well, for the same token-pasting reason.
#define CATCH_REGISTER_LISTENER(listenerType)                                         \
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION                                         \
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS                                          \
    namespace {                                                                       \
    Catch::ListenerRegistrar<listenerType> catch_internal_RegistrarFor##listenerType; \
    }                                                                                 \
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION
#else  // CATCH_CONFIG_DISABLE

// Disabled build: registration requests are dropped.
#define CATCH_REGISTER_REPORTER(name, reporterType)
#define CATCH_REGISTER_LISTENER(listenerType)

#endif  // CATCH_CONFIG_DISABLE

// end catch_reporter_registrars.hpp
// Allow users to base their work off existing reporters
// start catch_reporter_compact.h

namespace Catch {

// Reporter built on StreamingReporterBase. Only the callbacks it customises
// are declared here; their definitions are elsewhere.
struct CompactReporter : StreamingReporterBase<CompactReporter> {
    // Reuses the base-class constructor(s) unchanged.
    using StreamingReporterBase::StreamingReporterBase;

    ~CompactReporter() override;

    // One of the static functions every reporter has to provide (see
    // IStreamingReporter).
    static std::string getDescription();

    void noMatchingTestCases(std::string const &spec) override;

    void assertionStarting(AssertionInfo const &) override;

    bool assertionEnded(AssertionStats const &_assertionStats) override;

    void sectionEnded(SectionStats const &_sectionStats) override;

    void testRunEnded(TestRunStats const &_testRunStats) override;
};

}  // end namespace Catch

// end catch_reporter_compact.h
// start catch_reporter_console.h

#if defined(_MSC_VER)
#pragma warning(push)
#pragma warning(disable : 4061)  // Not all labels are EXPLICITLY handled in  \
                                 // switch Note that 4062 (not all labels are \
                                 // handled and default is missing) is enabled
#endif

namespace Catch {
// Fwd decls
struct SummaryColumn;
class TablePrinter;

// Reporter built on StreamingReporterBase; "console" is also the default
// reporter name used by ConfigData. Everything is only declared here; the
// definitions are elsewhere.
struct ConsoleReporter : StreamingReporterBase<ConsoleReporter> {
    // TablePrinter is only forward-declared at this point, which is why it is
    // held through a pointer.
    std::unique_ptr<TablePrinter> m_tablePrinter;

    ConsoleReporter(ReporterConfig const &config);
    ~ConsoleReporter() override;
    // One of the static functions every reporter has to provide (see
    // IStreamingReporter).
    static std::string getDescription();

    void noMatchingTestCases(std::string const &spec) override;

    void reportInvalidArguments(std::string const &arg) override;

    void assertionStarting(AssertionInfo const &) override;

    bool assertionEnded(AssertionStats const &_assertionStats) override;

    void sectionStarting(SectionInfo const &_sectionInfo) override;
    void sectionEnded(SectionStats const &_sectionStats) override;

    // Benchmark callbacks exist only when benchmarking support is compiled in.
#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
    void benchmarkPreparing(std::string const &name) override;
    void benchmarkStarting(BenchmarkInfo const &info) override;
    void benchmarkEnded(BenchmarkStats<> const &stats) override;
    void benchmarkFailed(std::string const &error) override;
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

    void testCaseEnded(TestCaseStats const &_testCaseStats) override;
    void testGroupEnded(TestGroupStats const &_testGroupStats) override;
    void testRunEnded(TestRunStats const &_testRunStats) override;
    void testRunStarting(TestRunInfo const &_testRunInfo) override;

private:
    // Private printing helpers.
    void lazyPrint();

    void lazyPrintWithoutClosingBenchmarkTable();
    void lazyPrintRunInfo();
    void lazyPrintGroupInfo();
    void printTestCaseAndSectionHeader();

    void printClosedHeader(std::string const &_name);
    void printOpenHeader(std::string const &_name);

    // If the string has a ':' in its first line, the indent is set so that
    // subsequent lines follow it.
    void printHeaderString(std::string const &_string, std::size_t indent = 0);

    void printTotals(Totals const &totals);
    void printSummaryRow(std::string const &label,
                         std::vector<SummaryColumn> const &cols,
                         std::size_t row);

    void printTotalsDivider(Totals const &totals);
    void printSummaryDivider();
    void printTestFilters();

private:
    // Starts out false; presumably set once the header has been written --
    // confirm against the definitions.
    bool m_headerPrinted = false;
};

}  // end namespace Catch

#if defined(_MSC_VER)
#pragma warning(pop)
#endif

// end catch_reporter_console.h
// start catch_reporter_junit.h

// start catch_xmlwriter.h

#include <vector>

namespace Catch {
// Formatting flags for XmlWriter output. Indent and Newline occupy separate
// bits, so they can be combined with the operator| declared below.
enum class XmlFormatting {
    None = 0x00,
    Indent = 0x01,
    Newline = 0x02,
};

// Operators for combining and testing XmlFormatting flags. Declared here,
// defined elsewhere.
XmlFormatting operator|(XmlFormatting lhs, XmlFormatting rhs);
XmlFormatting operator&(XmlFormatting lhs, XmlFormatting rhs);

// Holds a string together with the context it is to be encoded for (text node
// or attribute) and writes the encoded form to a stream on request. The
// encoding rules themselves are in the definitions, which are not visible
// here.
class XmlEncode {
public:
    // Where the encoded text is going to be placed.
    enum ForWhat { ForTextNodes, ForAttributes };

    // Keeps a copy of `str`; the context defaults to text nodes.
    XmlEncode(std::string const &str, ForWhat forWhat = ForTextNodes);

    void encodeTo(std::ostream &os) const;

    // Allows an XmlEncode to be streamed directly.
    friend std::ostream &operator<<(std::ostream &os, XmlEncode const &xmlEncode);

private:
    std::string m_str;
    ForWhat m_forWhat;
};

// Writes XML to an std::ostream. Most members return the writer itself so
// that calls can be chained. Apart from the two writeAttribute templates, the
// member functions are only declared here. Formatting arguments default to
// Newline | Indent.
class XmlWriter {
public:
    // Movable handle returned by scopedElement(). It forwards text and
    // attribute writes to the writer it was created from.
    // NOTE(review): presumably its destructor ends the element -- confirm
    // against the definition.
    class ScopedElement {
    public:
        ScopedElement(XmlWriter *writer, XmlFormatting fmt);

        ScopedElement(ScopedElement &&other) noexcept;
        ScopedElement &operator=(ScopedElement &&other) noexcept;

        ~ScopedElement();

        ScopedElement &writeText(std::string const &text,
                                 XmlFormatting fmt = XmlFormatting::Newline |
                                                     XmlFormatting::Indent);

        // Forwards to XmlWriter::writeAttribute and returns this handle for
        // chaining. m_writer is dereferenced without a null check.
        template <typename T>
        ScopedElement &writeAttribute(std::string const &name, T const &attribute) {
            m_writer->writeAttribute(name, attribute);
            return *this;
        }

    private:
        mutable XmlWriter *m_writer = nullptr;
        XmlFormatting m_fmt;
    };

    // Writes to Catch::cout() unless another stream is given.
    XmlWriter(std::ostream &os = Catch::cout());
    ~XmlWriter();

    // Not copyable.
    XmlWriter(XmlWriter const &) = delete;
    XmlWriter &operator=(XmlWriter const &) = delete;

    XmlWriter &startElement(std::string const &name,
                            XmlFormatting fmt = XmlFormatting::Newline | XmlFormatting::Indent);

    ScopedElement scopedElement(std::string const &name,
                                XmlFormatting fmt = XmlFormatting::Newline | XmlFormatting::Indent);

    XmlWriter &endElement(XmlFormatting fmt = XmlFormatting::Newline | XmlFormatting::Indent);

    XmlWriter &writeAttribute(std::string const &name, std::string const &attribute);

    XmlWriter &writeAttribute(std::string const &name, bool attribute);

    // Generic overload: the value is streamed into a ReusableStringStream and
    // the resulting text is written through the std::string overload.
    template <typename T>
    XmlWriter &writeAttribute(std::string const &name, T const &attribute) {
        ReusableStringStream rss;
        rss << attribute;
        return writeAttribute(name, rss.str());
    }

    XmlWriter &writeText(std::string const &text,
                         XmlFormatting fmt = XmlFormatting::Newline | XmlFormatting::Indent);

    XmlWriter &writeComment(std::string const &text,
                            XmlFormatting fmt = XmlFormatting::Newline | XmlFormatting::Indent);

    void writeStylesheetRef(std::string const &url);

    XmlWriter &writeBlankLine();

    void ensureTagClosed();

private:
    void applyFormatting(XmlFormatting fmt);

    void writeDeclaration();

    void newlineIfNecessary();

    bool m_tagIsOpen = false;
    bool m_needsNewline = false;
    // Presumably the names of the elements that are currently open -- confirm
    // against startElement()/endElement().
    std::vector<std::string> m_tags;
    std::string m_indent;
    // The stream all output goes to (bound in the constructor).
    std::ostream &m_os;
};

}  // namespace Catch

// end catch_xmlwriter.h
namespace Catch {

/// Reporter built on CumulativeReporterBase that owns an XmlWriter (`xml`).
/// NOTE(review): only declarations are visible here; the member definitions
/// live elsewhere, so the notes below describe the declared interface only.
class JunitReporter : public CumulativeReporterBase<JunitReporter> {
public:
    JunitReporter(ReporterConfig const &_config);

    ~JunitReporter() override;

    // Human-readable description of this reporter.
    static std::string getDescription();

    // Reporter event overrides.
    void noMatchingTestCases(std::string const & /*spec*/) override;

    void testRunStarting(TestRunInfo const &runInfo) override;

    void testGroupStarting(GroupInfo const &groupInfo) override;

    void testCaseStarting(TestCaseInfo const &testCaseInfo) override;
    bool assertionEnded(AssertionStats const &assertionStats) override;

    void testCaseEnded(TestCaseStats const &testCaseStats) override;

    void testGroupEnded(TestGroupStats const &testGroupStats) override;

    void testRunEndedCumulative() override;

    // Output helpers, one per level of the accumulated result tree
    // (group -> test case -> section -> assertion).
    void writeGroup(TestGroupNode const &groupNode, double suiteTime);

    void writeTestCase(TestCaseNode const &testCaseNode);

    void writeSection(std::string const &className,
                      std::string const &rootName,
                      SectionNode const &sectionNode,
                      bool testOkToFail);

    void writeAssertions(SectionNode const &sectionNode);
    void writeAssertion(AssertionStats const &stats);

    XmlWriter xml;                          // writer all output goes through
    Timer suiteTimer;                       // presumably times the current suite -- confirm in the .cpp part
    std::string stdOutForSuite;             // presumably captured stdout of the suite -- confirm
    std::string stdErrForSuite;             // presumably captured stderr of the suite -- confirm
    unsigned int unexpectedExceptions = 0;  // counter, starts at zero
    bool m_okToFail = false;
};

}  // end namespace Catch

// end catch_reporter_junit.h
// start catch_reporter_xml.h

namespace Catch {
/// Reporter built on StreamingReporterBase that owns an XmlWriter (`m_xml`).
/// NOTE(review): only declarations are visible here; behaviour is defined
/// elsewhere in the file.
class XmlReporter : public StreamingReporterBase<XmlReporter> {
public:
    XmlReporter(ReporterConfig const &_config);

    ~XmlReporter() override;

    // Human-readable description of this reporter.
    static std::string getDescription();

    // Virtual so that derived reporters can supply their own stylesheet reference.
    virtual std::string getStylesheetRef() const;

    void writeSourceInfo(SourceLineInfo const &sourceInfo);

public:  // StreamingReporterBase event overrides
    void noMatchingTestCases(std::string const &s) override;

    void testRunStarting(TestRunInfo const &testInfo) override;

    void testGroupStarting(GroupInfo const &groupInfo) override;

    void testCaseStarting(TestCaseInfo const &testInfo) override;

    void sectionStarting(SectionInfo const &sectionInfo) override;

    void assertionStarting(AssertionInfo const &) override;

    bool assertionEnded(AssertionStats const &assertionStats) override;

    void sectionEnded(SectionStats const &sectionStats) override;

    void testCaseEnded(TestCaseStats const &testCaseStats) override;

    void testGroupEnded(TestGroupStats const &testGroupStats) override;

    void testRunEnded(TestRunStats const &testRunStats) override;

    // Benchmark events exist only when benchmarking support is compiled in.
#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
    void benchmarkPreparing(std::string const &name) override;
    void benchmarkStarting(BenchmarkInfo const &) override;
    void benchmarkEnded(BenchmarkStats<> const &) override;
    void benchmarkFailed(std::string const &) override;
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

private:
    Timer m_testCaseTimer;
    XmlWriter m_xml;         // writer all output goes through
    int m_sectionDepth = 0;  // starts at zero; presumably the current section nesting level -- confirm
};

}  // end namespace Catch

// end catch_reporter_xml.h

// end catch_external_interfaces.h
#endif

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// start catch_benchmarking_all.hpp

// A proxy header that includes all of the benchmarking headers to allow
// concise include of the benchmarking features. You should prefer the
// individual includes in standard use.

// start catch_benchmark.hpp

// Benchmark

// start catch_chronometer.hpp

// User-facing chronometer

// start catch_clock.hpp

// Clocks

#include <chrono>
#include <ratio>

namespace Catch {
namespace Benchmark {
/// Clock used by the benchmarking code when the caller does not pick one.
using default_clock = std::chrono::steady_clock;

/// Seconds stored as a double.
using fp_seconds = std::chrono::duration<double, std::ratio<1>>;

/// Native duration type of `Clock`.
template <typename Clock>
using ClockDuration = typename Clock::duration;

/// Time point type of `Clock`.
template <typename Clock>
using TimePoint = typename Clock::time_point;

/// Duration with the tick period of `Clock` but a double representation.
template <typename Clock>
using FloatDuration = std::chrono::duration<double, typename Clock::period>;

/// Stateless function object that returns the current time of `Clock`.
template <typename Clock>
struct now {
    auto operator()() const -> TimePoint<Clock> {
        return Clock::now();
    }
};
}  // namespace Benchmark
}  // namespace Catch

// end catch_clock.hpp
// start catch_optimizer.hpp

// Hinting the optimizer

#if defined(_MSC_VER)
#include <atomic>  // atomic_thread_fence
#endif

namespace Catch {
namespace Benchmark {
#if defined(__GNUC__) || defined(__clang__)
/// Passes `p` to an empty asm statement with a "memory" clobber, so the
/// compiler must treat the pointed-to object as used and possibly modified.
template <typename T>
inline void keep_memory(T *p) {
    asm volatile("" : : "g"(p) : "memory");
}
/// Compiler-level memory barrier with no associated object.
inline void keep_memory() { asm volatile("" : : : "memory"); }

namespace Detail {
inline void optimizer_barrier() { keep_memory(); }
}  // namespace Detail
#elif defined(_MSC_VER)

#pragma optimize("", off)
/// MSVC variant: a volatile read and write-back of the first byte of `*p`,
/// compiled with optimizations switched off.
template <typename T>
inline void keep_memory(T *p) {
    // thanks @milleniumbug
    *reinterpret_cast<char volatile *>(p) = *reinterpret_cast<char const volatile *>(p);
}
// TODO equivalent keep_memory()
#pragma optimize("", on)

namespace Detail {
inline void optimizer_barrier() { std::atomic_thread_fence(std::memory_order_seq_cst); }
}  // namespace Detail

#endif

/// Marks `x` as observed via keep_memory so the computation that produced it
/// cannot be discarded.
template <typename T>
inline void deoptimize_value(T &&x) {
    keep_memory(&x);
}

/// Calls `fn(args...)` and feeds a non-void result to deoptimize_value.
///
/// Each argument is forwarded individually (`std::forward<Args>(args)...`).
/// The previous spelling, `std::forward<Args...>(args...)`, expanded the pack
/// inside a single std::forward call and therefore only compiled when exactly
/// one argument was supplied.
template <typename Fn, typename... Args>
inline auto invoke_deoptimized(Fn &&fn, Args &&...args) ->
        typename std::enable_if<!std::is_same<void, decltype(fn(args...))>::value>::type {
    deoptimize_value(std::forward<Fn>(fn)(std::forward<Args>(args)...));
}

/// Overload for callables returning void: there is no result to keep alive,
/// so the callable is simply invoked with perfectly forwarded arguments.
template <typename Fn, typename... Args>
inline auto invoke_deoptimized(Fn &&fn, Args &&...args) ->
        typename std::enable_if<std::is_same<void, decltype(fn(args...))>::value>::type {
    std::forward<Fn>(fn)(std::forward<Args>(args)...);
}
}  // namespace Benchmark
}  // namespace Catch

// end catch_optimizer.hpp
// start catch_complete_invoke.hpp

// Invoke with a special case for void

#include <type_traits>
#include <utility>

namespace Catch {
namespace Benchmark {
namespace Detail {
/// Maps a type to one that can always be stored in a variable: every type
/// maps to itself, except `void`, which maps to an empty placeholder struct.
template <typename T>
struct CompleteType {
    using type = T;
};
template <>
struct CompleteType<void> {
    struct type {};
};

/// Shorthand for `CompleteType<T>::type`.
template <typename T>
using CompleteType_t = typename CompleteType<T>::type;

/// Invokes a callable with perfectly forwarded arguments and returns its
/// result as `Result`.
template <typename Result>
struct CompleteInvoker {
    template <typename Fun, typename... Args>
    static Result invoke(Fun &&fun, Args &&...args) {
        return std::forward<Fun>(fun)(std::forward<Args>(args)...);
    }
};
/// Specialization for callables returning void: the callable is still
/// invoked, and an empty `CompleteType_t<void>` placeholder is returned.
template <>
struct CompleteInvoker<void> {
    template <typename Fun, typename... Args>
    static CompleteType_t<void> invoke(Fun &&fun, Args &&...args) {
        std::forward<Fun>(fun)(std::forward<Args>(args)...);
        return {};
    }
};

// Invokes `fun(args...)` but never returns void: the CompleteInvoker chosen by
// the callable's return type yields either the real result or, for void, an
// empty placeholder object.
template <typename Fun, typename... Args>
CompleteType_t<FunctionReturnType<Fun, Args...>> complete_invoke(Fun &&fun, Args &&...args) {
    return CompleteInvoker<FunctionReturnType<Fun, Args...>>::invoke(std::forward<Fun>(fun),
                                                                     std::forward<Args>(args)...);
}

// Message of the error raised by user_code() after a failure has already been
// reported; Benchmark::run() compares against it to decide whether to rethrow.
const std::string benchmarkErrorMsg = "a benchmark failed to run successfully";
}  // namespace Detail

/// Runs `fun` through Detail::complete_invoke and returns its (never-void)
/// result. If anything is thrown, the translated exception text is passed to
/// getResultCapture().benchmarkFailed() and CATCH_RUNTIME_ERROR is then raised
/// with Detail::benchmarkErrorMsg in place of the original exception.
template <typename Fun>
Detail::CompleteType_t<FunctionReturnType<Fun>> user_code(Fun &&fun) {
    CATCH_TRY { return Detail::complete_invoke(std::forward<Fun>(fun)); }
    CATCH_CATCH_ALL {
        getResultCapture().benchmarkFailed(translateActiveException());
        CATCH_RUNTIME_ERROR(Detail::benchmarkErrorMsg);
    }
}
}  // namespace Benchmark
}  // namespace Catch

// end catch_complete_invoke.hpp
namespace Catch {
namespace Benchmark {
namespace Detail {
/// Abstract start/finish interface that Chronometer drives through a pointer,
/// so Chronometer itself does not depend on the clock type.
struct ChronometerConcept {
    virtual void start() = 0;
    virtual void finish() = 0;
    virtual ~ChronometerConcept() = default;
};
/// ChronometerConcept implementation that records Clock::now() on start() and
/// on finish(); elapsed() is the difference between the two recorded points.
template <typename Clock>
struct ChronometerModel final : public ChronometerConcept {
    void start() override { started = Clock::now(); }
    void finish() override { finished = Clock::now(); }

    ClockDuration<Clock> elapsed() const { return finished - started; }

    TimePoint<Clock> started;
    TimePoint<Clock> finished;
};
}  // namespace Detail

struct Chronometer {
public:
    template <typename Fun>
    void measure(Fun &&fun) {
        measure(std::forward<Fun>(fun), is_callable<Fun(int)>());
    }

    int runs() const { return k; }

    Chronometer(Detail::ChronometerConcept &meter, int k) : impl(&meter), k(k) {}

private:
    template <typename Fun>
    void measure(Fun &&fun, std::false_type) {
        measure([&fun](int) { return fun(); }, std::true_type());
    }

    template <typename Fun>
    void measure(Fun &&fun, std::true_type) {
        Detail::optimizer_barrier();
        impl->start();
        for (int i = 0; i < k; ++i)
            invoke_deoptimized(fun, i);
        impl->finish();
        Detail::optimizer_barrier();
    }

    Detail::ChronometerConcept *impl;
    int k;
};
}  // namespace Benchmark
}  // namespace Catch

// end catch_chronometer.hpp
// start catch_environment.hpp

// Environment information

namespace Catch {
namespace Benchmark {
/// A mean duration together with the outlier classification of the samples
/// it was computed from.
template <typename Duration>
struct EnvironmentEstimate {
    Duration mean;
    OutlierClassification outliers;

    // Converts to an estimate expressed in another duration type.
    template <typename Duration2>
    operator EnvironmentEstimate<Duration2>() const {
        return {mean, outliers};
    }
};
/// Measured properties of a clock: the estimated resolution and the estimated
/// cost of reading it, both filled in by Detail::measure_environment().
template <typename Clock>
struct Environment {
    using clock_type = Clock;
    EnvironmentEstimate<FloatDuration<Clock>> clock_resolution;
    EnvironmentEstimate<FloatDuration<Clock>> clock_cost;
};
}  // namespace Benchmark
}  // namespace Catch

// end catch_environment.hpp
// start catch_execution_plan.hpp

// Execution plan

// start catch_benchmark_function.hpp

// Dumb std::function implementation for consistent call overhead

#include <cassert>
#include <memory>
#include <type_traits>
#include <utility>

namespace Catch {
namespace Benchmark {
namespace Detail {
/// Shorthand for `std::decay<T>::type`.
template <typename T>
using Decay = typename std::decay<T>::type;
/// True when T and U are the same type after decay (cv-qualifiers and
/// references ignored).
template <typename T, typename U>
struct is_related : std::is_same<Decay<T>, Decay<U>> {};

/// We need to reinvent std::function because every piece of code that might add
/// overhead in a measurement context needs to have consistent performance
/// characteristics so that we can account for it in the measurement.
/// Implementations of std::function with optimizations that aren't always
/// applicable, like small buffer optimizations, are not uncommon. This is
/// effectively an implementation of std::function without any such
/// optimizations; it may be slow, but it is consistently slow.
struct BenchmarkFunction {
private:
    // Type-erased interface: every stored callable is reached through one
    // virtual call and can be cloned for copying.
    struct callable {
        virtual void call(Chronometer meter) const = 0;
        virtual callable *clone() const = 0;
        virtual ~callable() = default;
    };
    // Concrete holder for a callable of type Fun.
    template <typename Fun>
    struct model : public callable {
        model(Fun &&fun) : fun(std::move(fun)) {}
        model(Fun const &fun) : fun(fun) {}

        // Returns a heap-allocated copy; the caller takes ownership.
        model<Fun> *clone() const override { return new model<Fun>(*this); }

        // Dispatches on whether Fun accepts a Chronometer directly.
        void call(Chronometer meter) const override {
            call(meter, is_callable<Fun(Chronometer)>());
        }
        // Fun takes the Chronometer and decides itself what gets measured.
        void call(Chronometer meter, std::true_type) const { fun(meter); }
        // Otherwise the whole callable is what gets measured.
        void call(Chronometer meter, std::false_type) const { meter.measure(fun); }

        Fun fun;
    };

    // Callable stored by the default constructor.
    struct do_nothing {
        void operator()() const {}
    };

    // Takes ownership of an already allocated model.
    template <typename T>
    BenchmarkFunction(model<T> *c) : f(c) {}

public:
    BenchmarkFunction() : f(new model<do_nothing>{{}}) {}

    // Wraps any callable; disabled for BenchmarkFunction itself so that the
    // copy and move constructors below are selected instead.
    template <typename Fun,
              typename std::enable_if<!is_related<Fun, BenchmarkFunction>::value, int>::type = 0>
    BenchmarkFunction(Fun &&fun)
            : f(new model<typename std::decay<Fun>::type>(std::forward<Fun>(fun))) {}

    // Moving transfers the stored callable and leaves `that` holding nothing.
    BenchmarkFunction(BenchmarkFunction &&that) : f(std::move(that.f)) {}

    // Copying clones the stored callable.
    BenchmarkFunction(BenchmarkFunction const &that) : f(that.f->clone()) {}

    BenchmarkFunction &operator=(BenchmarkFunction &&that) {
        f = std::move(that.f);
        return *this;
    }

    BenchmarkFunction &operator=(BenchmarkFunction const &that) {
        // clone() runs before reset() replaces the old callable.
        f.reset(that.f->clone());
        return *this;
    }

    void operator()(Chronometer meter) const { f->call(meter); }

private:
    std::unique_ptr<callable> f;
};
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

// end catch_benchmark_function.hpp
// start catch_repeat.hpp

// repeat algorithm

#include <type_traits>
#include <utility>

namespace Catch {
namespace Benchmark {
namespace Detail {
/// Function object that calls the stored callable `k` times when invoked
/// with `k`; a non-positive `k` results in no calls.
template <typename Fun>
struct repeater {
    void operator()(int k) const {
        for (int remaining = k; remaining > 0; --remaining) {
            fun();
        }
    }
    Fun fun;
};

/// Wraps `fun` (stored by decayed type) in a repeater.
template <typename Fun>
repeater<typename std::decay<Fun>::type> repeat(Fun &&fun) {
    return {std::forward<Fun>(fun)};
}
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

// end catch_repeat.hpp
// start catch_run_for_at_least.hpp

// Run a function for a minimum amount of time

// start catch_measure.hpp

// Measure

// start catch_timing.hpp

// Timing

#include <tuple>
#include <type_traits>

namespace Catch {
namespace Benchmark {
/// Result of one timed invocation: how long it took, what the callable
/// returned, and how many iterations the timing covers.
template <typename Duration, typename Result>
struct Timing {
    Duration elapsed;
    Result result;
    int iterations;
};
/// Timing type for calling `Func` with `Args...` under `Clock`; a void return
/// type is replaced by the CompleteType placeholder.
template <typename Clock, typename Func, typename... Args>
using TimingOf =
        Timing<ClockDuration<Clock>, Detail::CompleteType_t<FunctionReturnType<Func, Args...>>>;
}  // namespace Benchmark
}  // namespace Catch

// end catch_timing.hpp
#include <utility>

namespace Catch {
namespace Benchmark {
namespace Detail {
/// Invokes `fun(args...)` once, reading `Clock` immediately before and after,
/// and returns the elapsed time, the (never-void) result and an iteration
/// count of 1.
template <typename Clock, typename Fun, typename... Args>
TimingOf<Clock, Fun, Args...> measure(Fun &&fun, Args &&...args) {
    auto const began = Clock::now();
    auto &&outcome = Detail::complete_invoke(fun, std::forward<Args>(args)...);
    auto const ended = Clock::now();
    return {ended - began, std::forward<decltype(outcome)>(outcome), 1};
}
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

// end catch_measure.hpp
#include <type_traits>
#include <utility>

namespace Catch {
namespace Benchmark {
namespace Detail {
/// Overload for callables that do not take a Chronometer: `fun(iters)` is
/// timed as a whole by Detail::measure.
template <typename Clock, typename Fun>
TimingOf<Clock, Fun, int> measure_one(Fun &&fun, int iters, std::false_type) {
    return Detail::measure<Clock>(fun, iters);
}
/// Overload for callables that take a Chronometer: the callable receives a
/// Chronometer bound to a local ChronometerModel and `iters`, and the reported
/// time is whatever that model recorded between start() and finish().
template <typename Clock, typename Fun>
TimingOf<Clock, Fun, Chronometer> measure_one(Fun &&fun, int iters, std::true_type) {
    Detail::ChronometerModel<Clock> stopwatch;
    auto &&outcome = Detail::complete_invoke(fun, Chronometer(stopwatch, iters));

    return {stopwatch.elapsed(), std::move(outcome), iters};
}

/// Argument type run_for_at_least passes to `Fun`: Chronometer when `Fun` is
/// callable with one, int (the iteration count) otherwise.
template <typename Clock, typename Fun>
using run_for_at_least_argument_t =
        typename std::conditional<is_callable<Fun(Chronometer)>::value, Chronometer, int>::type;

/// Thrown by run_for_at_least when no iteration count below its limit makes
/// the benchmark run for the requested time.
struct optimized_away_error : std::exception {
    const char *what() const noexcept override {
        static const char message[] =
                "could not measure benchmark, maybe it was optimized away";
        return message;
    }
};

/// Repeatedly measures `fun`, starting with `seed` iterations and doubling the
/// count each round, until one measurement lasts at least `how_long`; that
/// measurement is returned. Throws optimized_away_error if the iteration count
/// reaches 2^30 without any measurement being long enough.
template <typename Clock, typename Fun>
TimingOf<Clock, Fun, run_for_at_least_argument_t<Clock, Fun>>
run_for_at_least(ClockDuration<Clock> how_long, int seed, Fun &&fun) {
    for (auto iters = seed; iters < (1 << 30); iters *= 2) {
        auto &&attempt = measure_one<Clock>(fun, iters, is_callable<Fun(Chronometer)>());

        if (attempt.elapsed >= how_long) {
            return {attempt.elapsed, std::move(attempt.result), iters};
        }
    }
    Catch::throw_exception(optimized_away_error{});
}
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

// end catch_run_for_at_least.hpp
#include <algorithm>
#include <iterator>

namespace Catch {
namespace Benchmark {
/// Everything needed to run one benchmark: the number of iterations per
/// sample, the estimated total duration, the benchmark callable and the
/// warm-up settings.
template <typename Duration>
struct ExecutionPlan {
    int iterations_per_sample;
    Duration estimated_duration;
    Detail::BenchmarkFunction benchmark;
    Duration warmup_time;
    int warmup_iterations;

    /// Converts the plan to one expressed in another duration type.
    template <typename Duration2>
    operator ExecutionPlan<Duration2>() const {
        return {iterations_per_sample, estimated_duration, benchmark, warmup_time,
                warmup_iterations};
    }

    /// Warms up by reading the clock repeatedly for at least `warmup_time`,
    /// then collects `cfg.benchmarkSamples()` samples. Each sample is the time
    /// of one benchmark run minus the mean clock cost (clamped at zero),
    /// divided by the number of iterations per sample.
    template <typename Clock>
    std::vector<FloatDuration<Clock>> run(const IConfig &cfg,
                                          Environment<FloatDuration<Clock>> env) const {
        // warmup a bit
        auto const warmup_budget = std::chrono::duration_cast<ClockDuration<Clock>>(warmup_time);
        Detail::run_for_at_least<Clock>(warmup_budget, warmup_iterations,
                                        Detail::repeat(now<Clock>{}));

        std::vector<FloatDuration<Clock>> times;
        times.reserve(cfg.benchmarkSamples());
        for (auto remaining = cfg.benchmarkSamples(); remaining > 0; --remaining) {
            Detail::ChronometerModel<Clock> model;
            benchmark(Chronometer(model, iterations_per_sample));
            auto sample_time = model.elapsed() - env.clock_cost.mean;
            if (sample_time < FloatDuration<Clock>::zero()) {
                sample_time = FloatDuration<Clock>::zero();
            }
            times.push_back(sample_time / iterations_per_sample);
        }
        return times;
    }
};
}  // namespace Benchmark
}  // namespace Catch

// end catch_execution_plan.hpp
// start catch_estimate_clock.hpp

// Environment measurement

// start catch_stats.hpp

// Statistical analysis tools

#include <algorithm>
#include <cmath>
#include <cstddef>
#include <functional>
#include <iterator>
#include <numeric>
#include <random>
#include <tuple>
#include <utility>
#include <vector>

namespace Catch {
namespace Benchmark {
namespace Detail {
using sample = std::vector<double>;

double weighted_average_quantile(int k,
                                 int q,
                                 std::vector<double>::iterator first,
                                 std::vector<double>::iterator last);

/// Counts how many values in [first, last) fall outside the inter-quartile
/// fences: more than 1.5 * IQR beyond a quartile counts as mild, more than
/// 3 * IQR as severe. The quartiles are computed on a private copy of the
/// range.
template <typename Iterator>
OutlierClassification classify_outliers(Iterator first, Iterator last) {
    std::vector<double> scratch(first, last);

    auto const q1 = weighted_average_quantile(1, 4, scratch.begin(), scratch.end());
    auto const q3 = weighted_average_quantile(3, 4, scratch.begin(), scratch.end());
    auto const iqr = q3 - q1;
    auto const severe_low = q1 - (iqr * 3.);
    auto const mild_low = q1 - (iqr * 1.5);
    auto const mild_high = q3 + (iqr * 1.5);
    auto const severe_high = q3 + (iqr * 3.);

    OutlierClassification tally;
    while (first != last) {
        auto &&value = *first;
        if (value < severe_low) {
            ++tally.low_severe;
        } else if (value < mild_low) {
            ++tally.low_mild;
        } else if (value > severe_high) {
            ++tally.high_severe;
        } else if (value > mild_high) {
            ++tally.high_mild;
        }
        ++tally.samples_seen;
        ++first;
    }
    return tally;
}

/// Arithmetic mean of [first, last): the sum of the values (accumulated as
/// double) divided by the number of elements.
template <typename Iterator>
double mean(Iterator first, Iterator last) {
    auto const n_values = last - first;
    double const total = std::accumulate(first, last, 0.);
    return total / n_values;
}

/// Bootstrap resampling: `resamples` times, draws as many values as the input
/// holds (uniformly, with replacement) from [first, last), applies `estimator`
/// to the drawn values and collects the result. The collected estimates are
/// returned sorted in ascending order.
template <typename URng, typename Iterator, typename Estimator>
sample resample(URng &rng, int resamples, Iterator first, Iterator last, Estimator &estimator) {
    auto n = last - first;
    std::uniform_int_distribution<decltype(n)> pick(0, n - 1);

    sample estimates;
    estimates.reserve(resamples);
    for (int round = 0; round < resamples; ++round) {
        std::vector<double> drawn;
        drawn.reserve(n);
        for (decltype(n) taken = 0; taken < n; ++taken) {
            drawn.push_back(first[pick(rng)]);
        }
        estimates.push_back(estimator(drawn.begin(), drawn.end()));
    }
    std::sort(estimates.begin(), estimates.end());
    return estimates;
}

/// Leave-one-out estimates: for each position in [first, last) the element at
/// that position is swapped to the front and `estimator` is applied to
/// everything after the front element. Note that the input range is reordered
/// in the process.
template <typename Estimator, typename Iterator>
sample jackknife(Estimator &&estimator, Iterator first, Iterator last) {
    auto count = last - first;
    auto tail_begin = std::next(first);
    sample leave_one_out;
    leave_one_out.reserve(count);

    auto cursor = first;
    while (cursor != last) {
        std::iter_swap(cursor, first);
        leave_one_out.push_back(estimator(tail_begin, last));
        ++cursor;
    }

    return leave_one_out;
}

/// Cumulative distribution function of the standard normal distribution,
/// expressed through the complementary error function.
inline double normal_cdf(double x) {
    double const scaled = -x / std::sqrt(2.0);
    return std::erfc(scaled) / 2.0;
}

double erfc_inv(double x);

double normal_quantile(double p);

/// Computes a point estimate and confidence bounds for `estimator` over
/// [first, last), using the pre-computed, sorted bootstrap distribution
/// `resample`.
///
/// The bounds are picked from `resample` at indices derived from a bias term
/// (share of resampled estimates below the point estimate) and an
/// acceleration term (from the jackknife estimates).
///
/// \param confidence_level  confidence level of the interval (e.g. 0.95)
/// \param first, last       the original samples; reordered by jackknife()
/// \param resample          sorted resampled estimates
///                          (assumed non-empty -- TODO confirm with callers)
/// \param estimator         statistic to evaluate, called as estimator(it, it)
/// \return {point, lower bound, upper bound, confidence_level}; all three
///         values equal the point estimate in the degenerate cases below
template <typename Iterator, typename Estimator>
Estimate<double> bootstrap(double confidence_level,
                           Iterator first,
                           Iterator last,
                           sample const &resample,
                           Estimator &&estimator) {
    auto n_samples = last - first;

    double point = estimator(first, last);
    // Degenerate case with a single sample
    if (n_samples == 1)
        return {point, point, point, confidence_level};

    sample jack = jackknife(estimator, first, last);
    double jack_mean = mean(jack.begin(), jack.end());
    double sum_squares, sum_cubes;
    // Sum of squared and cubed deviations of the jackknife estimates from
    // their mean, accumulated in one pass.
    std::tie(sum_squares, sum_cubes) = std::accumulate(
            jack.begin(), jack.end(), std::make_pair(0., 0.),
            [jack_mean](std::pair<double, double> sqcb, double x) -> std::pair<double, double> {
                auto d = jack_mean - x;
                auto d2 = d * d;
                auto d3 = d2 * d;
                return {sqcb.first + d2, sqcb.second + d3};
            });

    double accel = sum_cubes / (6 * std::pow(sum_squares, 1.5));
    int n = static_cast<int>(resample.size());
    double prob_n = std::count_if(resample.begin(), resample.end(),
                                  [point](double x) { return x < point; }) /
                    (double)n;
    // degenerate case with uniform samples
    if (prob_n == 0)
        return {point, point, point, confidence_level};

    double bias = normal_quantile(prob_n);
    double z1 = normal_quantile((1. - confidence_level) / 2.);

    auto cumn = [n](double x) -> int { return std::lround(normal_cdf(x) * n); };
    auto a = [bias, accel](double b) { return bias + b / (1. - accel * b); };
    // Both indices are clamped to [0, n - 1]. Previously `lo` was only bounded
    // from below and `hi` only from above, so a strongly skewed distribution
    // (cumn() rounding up to n, or a negative value for `hi`) could index
    // outside `resample`.
    auto clamp_index = [n](int idx) { return (std::max)((std::min)(idx, n - 1), 0); };
    double b1 = bias + z1;
    double b2 = bias - z1;
    double a1 = a(b1);
    double a2 = a(b2);
    auto lo = clamp_index(cumn(a1));
    auto hi = clamp_index(cumn(a2));

    return {point, resample[lo], resample[hi], confidence_level};
}

double outlier_variance(Estimate<double> mean, Estimate<double> stddev, int n);

/// Result of analyse_samples(): estimates of the mean and the standard
/// deviation, plus the outlier variance.
struct bootstrap_analysis {
    Estimate<double> mean;
    Estimate<double> standard_deviation;
    double outlier_variance;
};

bootstrap_analysis analyse_samples(double confidence_level,
                                   int n_resamples,
                                   std::vector<double>::iterator first,
                                   std::vector<double>::iterator last);
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

// end catch_stats.hpp
#include <algorithm>
#include <cmath>
#include <iterator>
#include <tuple>
#include <vector>

namespace Catch {
namespace Benchmark {
namespace Detail {
template <typename Clock>
std::vector<double> resolution(int k) {
    std::vector<TimePoint<Clock>> times;
    times.reserve(k + 1);
    std::generate_n(std::back_inserter(times), k + 1, now<Clock>{});

    std::vector<double> deltas;
    deltas.reserve(k);
    std::transform(std::next(times.begin()), times.end(), times.begin(), std::back_inserter(deltas),
                   [](TimePoint<Clock> a, TimePoint<Clock> b) {
                       return static_cast<double>((a - b).count());
                   });

    return deltas;
}

// Tuning constants for environment estimation and benchmark planning.
// Iteration seed stored in the ExecutionPlan built by Benchmark::prepare().
const auto warmup_iterations = 10000;
// Minimum running time of warmup().
const auto warmup_time = std::chrono::milliseconds(100);
// Benchmark::prepare() multiplies the clock resolution by this to get the
// minimum time one sample should take.
const auto minimum_ticks = 1000;
// Initial iteration count used by warmup().
const auto warmup_seed = 10000;
// Minimum running time of estimate_clock_resolution().
const auto clock_resolution_estimation_time = std::chrono::milliseconds(500);
// estimate_clock_cost(): its time limit is the smaller of this value and
// resolution * clock_cost_estimation_tick_limit.
const auto clock_cost_estimation_time_limit = std::chrono::seconds(1);
const auto clock_cost_estimation_tick_limit = 100000;
// estimate_clock_cost(): minimum running time and initial iteration count of
// its calibration run.
const auto clock_cost_estimation_time = std::chrono::milliseconds(10);
const auto clock_cost_estimation_iterations = 10000;

/// Runs resolution<Clock> for at least `warmup_time`, starting from
/// `warmup_seed` iterations, and returns the iteration count that was needed.
template <typename Clock>
int warmup() {
    auto const budget = std::chrono::duration_cast<ClockDuration<Clock>>(warmup_time);
    auto const timing = run_for_at_least<Clock>(budget, warmup_seed, &resolution<Clock>);
    return timing.iterations;
}
/// Runs resolution<Clock> for at least `clock_resolution_estimation_time`,
/// starting from `iterations`, and summarises the measured tick deltas as
/// their mean plus an outlier classification.
template <typename Clock>
EnvironmentEstimate<FloatDuration<Clock>> estimate_clock_resolution(int iterations) {
    auto const budget =
            std::chrono::duration_cast<ClockDuration<Clock>>(clock_resolution_estimation_time);
    auto deltas = run_for_at_least<Clock>(budget, iterations, &resolution<Clock>).result;

    auto const average = mean(deltas.begin(), deltas.end());
    auto const outliers = classify_outliers(deltas.begin(), deltas.end());
    return {
            FloatDuration<Clock>(average),
            outliers,
    };
}
/// Estimates how long a single Clock::now() call takes.
///
/// \param resolution  the estimated clock resolution; it bounds how much time
///                    is spent sampling
/// \return the mean per-call cost (in clock ticks, as a FloatDuration) and the
///         outlier classification of the collected samples
template <typename Clock>
EnvironmentEstimate<FloatDuration<Clock>> estimate_clock_cost(FloatDuration<Clock> resolution) {
    // Sampling budget: resolution * tick limit, capped by the fixed time limit.
    auto time_limit = (std::min)(resolution * clock_cost_estimation_tick_limit,
                                 FloatDuration<Clock>(clock_cost_estimation_time_limit));
    // Measures how long k back-to-back Clock::now() calls take; the volatile
    // local keeps each call from being dropped.
    auto time_clock = [](int k) {
        return Detail::measure<Clock>([k] {
                   for (int i = 0; i < k; ++i) {
                       volatile auto ignored = Clock::now();
                       (void)ignored;
                   }
               })
                .elapsed;
    };
    // One call whose result is discarded (presumably a warm-up -- confirm).
    time_clock(1);
    int iters = clock_cost_estimation_iterations;
    // Calibration: find an iteration count for which time_clock runs at least
    // clock_cost_estimation_time.
    auto &&r = run_for_at_least<Clock>(
            std::chrono::duration_cast<ClockDuration<Clock>>(clock_cost_estimation_time), iters,
            time_clock);
    std::vector<double> times;
    // As many samples as fit into the budget, given how long calibration took.
    int nsamples = static_cast<int>(std::ceil(time_limit / r.elapsed));
    times.reserve(nsamples);
    // Each sample is the per-call cost: elapsed time divided by iteration count.
    std::generate_n(std::back_inserter(times), nsamples, [time_clock, &r] {
        return static_cast<double>((time_clock(r.iterations) / r.iterations).count());
    });
    return {
            FloatDuration<Clock>(mean(times.begin(), times.end())),
            classify_outliers(times.begin(), times.end()),
    };
}

/// Returns the clock resolution and clock cost estimates for `Clock`. The
/// measurement runs on the first call only; the result is stored in a
/// heap-allocated object held by a function-local static pointer (never
/// freed) and copied out on every call.
template <typename Clock>
Environment<FloatDuration<Clock>> measure_environment() {
    static Environment<FloatDuration<Clock>> *cached = nullptr;
    if (!cached) {
        auto warm_iters = Detail::warmup<Clock>();
        auto resolution_estimate = Detail::estimate_clock_resolution<Clock>(warm_iters);
        auto cost_estimate = Detail::estimate_clock_cost<Clock>(resolution_estimate.mean);

        cached = new Environment<FloatDuration<Clock>>{resolution_estimate, cost_estimate};
    }
    return *cached;
}
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

// end catch_estimate_clock.hpp
// start catch_analyse.hpp

// Run and analyse one benchmark

// start catch_sample_analysis.hpp

// Benchmark results

#include <algorithm>
#include <iterator>
#include <string>
#include <vector>

namespace Catch {
namespace Benchmark {
/// Outcome of analysing one benchmark: the raw samples, estimates of the mean
/// and standard deviation, the outlier classification and the outlier
/// variance.
template <typename Duration>
struct SampleAnalysis {
    std::vector<Duration> samples;
    Estimate<Duration> mean;
    Estimate<Duration> standard_deviation;
    OutlierClassification outliers;
    double outlier_variance;

    /// Converts the analysis to another duration type; every sample is
    /// converted individually with `Duration2(d)`.
    template <typename Duration2>
    operator SampleAnalysis<Duration2>() const {
        std::vector<Duration2> converted;
        converted.reserve(samples.size());
        for (Duration const &d : samples) {
            converted.push_back(Duration2(d));
        }
        return {
                std::move(converted), mean, standard_deviation, outliers, outlier_variance,
        };
    }
};
}  // namespace Benchmark
}  // namespace Catch

// end catch_sample_analysis.hpp
#include <algorithm>
#include <iterator>
#include <vector>

namespace Catch {
namespace Benchmark {
namespace Detail {
/// Turns the raw samples in [first, last) into a SampleAnalysis.
///
/// Unless `cfg.benchmarkNoAnalysis()` is set, the samples are analysed with
/// analyse_samples() and classify_outliers(). Otherwise only the plain mean is
/// computed and the remaining fields are zero or empty. The Environment
/// parameter is unused.
template <typename Duration, typename Iterator>
SampleAnalysis<Duration> analyse(const IConfig &cfg,
                                 Environment<Duration>,
                                 Iterator first,
                                 Iterator last) {
    if (!cfg.benchmarkNoAnalysis()) {
        // The statistics code works on plain doubles, so strip the duration type.
        std::vector<double> samples;
        samples.reserve(last - first);
        std::transform(first, last, std::back_inserter(samples),
                       [](Duration d) { return d.count(); });

        auto analysis = Catch::Benchmark::Detail::analyse_samples(cfg.benchmarkConfidenceInterval(),
                                                                  cfg.benchmarkResamples(),
                                                                  samples.begin(), samples.end());
        auto outliers = Catch::Benchmark::Detail::classify_outliers(samples.begin(), samples.end());

        // Re-wraps an estimate over doubles as an estimate over Duration.
        auto wrap_estimate = [](Estimate<double> e) {
            return Estimate<Duration>{
                    Duration(e.point),
                    Duration(e.lower_bound),
                    Duration(e.upper_bound),
                    e.confidence_interval,
            };
        };
        // Converted from `samples` after analyse_samples() has had access to
        // it, not from the original [first, last) range.
        std::vector<Duration> samples2;
        samples2.reserve(samples.size());
        std::transform(samples.begin(), samples.end(), std::back_inserter(samples2),
                       [](double d) { return Duration(d); });
        return {
                std::move(samples2),
                wrap_estimate(analysis.mean),
                wrap_estimate(analysis.standard_deviation),
                outliers,
                analysis.outlier_variance,
        };
    } else {
        std::vector<Duration> samples;
        samples.reserve(last - first);

        // Plain arithmetic mean; `i` ends up as the number of samples.
        Duration mean = Duration(0);
        int i = 0;
        for (auto it = first; it < last; ++it, ++i) {
            samples.push_back(Duration(*it));
            mean += Duration(*it);
        }
        mean /= i;

        // No analysis requested: the mean doubles as both of its bounds and
        // everything else is reported as zero.
        return {std::move(samples), Estimate<Duration>{mean, mean, mean, 0.0},
                Estimate<Duration>{Duration(0), Duration(0), Duration(0), 0.0},
                OutlierClassification{}, 0.0};
    }
}
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

// end catch_analyse.hpp
#include <algorithm>
#include <cmath>
#include <functional>
#include <string>
#include <vector>

namespace Catch {
namespace Benchmark {
/// A named benchmark. Assigning a callable to it (see operator=) stores the
/// callable and immediately runs the benchmark, reporting progress and
/// results through getResultCapture().
struct Benchmark {
    Benchmark(std::string &&name) : name(std::move(name)) {}

    template <class FUN>
    Benchmark(std::string &&name, FUN &&func) : fun(std::move(func)), name(std::move(name)) {}

    /// Builds the execution plan: measures the benchmark for at least the
    /// larger of the configured warm-up time and the minimum sample time
    /// (clock resolution * minimum_ticks), then derives from that measurement
    /// how many iterations one sample needs to reach the minimum sample time.
    template <typename Clock>
    ExecutionPlan<FloatDuration<Clock>> prepare(const IConfig &cfg,
                                                Environment<FloatDuration<Clock>> env) const {
        auto min_time = env.clock_resolution.mean * Detail::minimum_ticks;
        auto run_time =
                std::max(min_time,
                         std::chrono::duration_cast<decltype(min_time)>(cfg.benchmarkWarmupTime()));
        auto &&test = Detail::run_for_at_least<Clock>(
                std::chrono::duration_cast<ClockDuration<Clock>>(run_time), 1, fun);
        // Scale the measured iteration count so one sample lasts about min_time.
        int new_iters = static_cast<int>(std::ceil(min_time * test.iterations / test.elapsed));
        return {new_iters, test.elapsed / test.iterations * new_iters * cfg.benchmarkSamples(), fun,
                std::chrono::duration_cast<FloatDuration<Clock>>(cfg.benchmarkWarmupTime()),
                Detail::warmup_iterations};
    }

    /// Runs the benchmark end to end: measure the environment, prepare a plan,
    /// collect samples, analyse them and report each stage to the result
    /// capture.
    template <typename Clock = default_clock>
    void run() {
        IConfigPtr cfg = getCurrentContext().getConfig();

        auto env = Detail::measure_environment<Clock>();

        getResultCapture().benchmarkPreparing(name);
        CATCH_TRY {
            // prepare() and plan.run() execute user code, so both go through
            // user_code(), which reports failures before re-raising.
            auto plan = user_code([&] { return prepare<Clock>(*cfg, env); });

            BenchmarkInfo info{name,
                               plan.estimated_duration.count(),
                               plan.iterations_per_sample,
                               cfg->benchmarkSamples(),
                               cfg->benchmarkResamples(),
                               env.clock_resolution.mean.count(),
                               env.clock_cost.mean.count()};

            getResultCapture().benchmarkStarting(info);

            auto samples = user_code([&] { return plan.template run<Clock>(*cfg, env); });

            auto analysis = Detail::analyse(*cfg, env, samples.begin(), samples.end());
            BenchmarkStats<FloatDuration<Clock>> stats{info,
                                                       analysis.samples,
                                                       analysis.mean,
                                                       analysis.standard_deviation,
                                                       analysis.outliers,
                                                       analysis.outlier_variance};
            getResultCapture().benchmarkEnded(stats);
        }
        CATCH_CATCH_ALL {
            // An exception whose translated text equals benchmarkErrorMsg came
            // from user_code() and is swallowed here; anything else propagates.
            if (translateActiveException() !=
                Detail::benchmarkErrorMsg)  // benchmark errors have been reported,
                                            // otherwise rethrow.
                std::rethrow_exception(std::current_exception());
        }
    }

    // sets lambda to be used in fun *and* executes benchmark!
    // Disabled for Benchmark itself so ordinary copy/move assignment is unaffected.
    template <typename Fun,
              typename std::enable_if<!Detail::is_related<Fun, Benchmark>::value, int>::type = 0>
    Benchmark &operator=(Fun func) {
        fun = Detail::BenchmarkFunction(func);
        run();
        return *this;
    }

    // Always true; lets the benchmark macros declare a Benchmark inside an
    // `if` condition.
    explicit operator bool() { return true; }

private:
    Detail::BenchmarkFunction fun;
    std::string name;
};
}  // namespace Benchmark
}  // namespace Catch

// Expand to the first / second argument of an argument list; any further
// arguments are discarded.
#define INTERNAL_CATCH_GET_1_ARG(arg1, arg2, ...) arg1
#define INTERNAL_CATCH_GET_2_ARG(arg1, arg2, ...) arg2

// Declares a Benchmark called `BenchmarkName` inside an if-condition (the
// object converts to true) and assigns it a lambda taking an int named
// `benchmarkIndex`; the lambda body is the code that follows the macro.
// Benchmark's templated operator= runs the benchmark as part of that
// assignment.
#define INTERNAL_CATCH_BENCHMARK(BenchmarkName, name, benchmarkIndex) \
    if (Catch::Benchmark::Benchmark BenchmarkName{name})              \
    BenchmarkName = [&](int benchmarkIndex)

// Same as INTERNAL_CATCH_BENCHMARK, but leaves the lambda's parameter list to
// the code that follows the macro.
#define INTERNAL_CATCH_BENCHMARK_ADVANCED(BenchmarkName, name) \
    if (Catch::Benchmark::Benchmark BenchmarkName{name})       \
    BenchmarkName = [&]

// end catch_benchmark.hpp
// start catch_constructor.hpp

// Constructor and destructor helpers

#include <type_traits>

namespace Catch {
namespace Benchmark {
namespace Detail {
// Raw, suitably aligned storage for one T whose construction is triggered
// explicitly through construct().
//
// Destruct == true : the stored object is destroyed by ~ObjectStorage() and
//                    the public destruct() is disabled.
// Destruct == false: ~ObjectStorage() leaves the object alone and the caller
//                    destroys it through destruct().
//
// The copy/move constructors copy/move-construct from the object held by
// `other`, so `other` must already contain a constructed object.
template <typename T, bool Destruct>
struct ObjectStorage {
    using TStorage = typename std::aligned_storage<sizeof(T), std::alignment_of<T>::value>::type;

    // Leaves the storage without a constructed T; call construct() before use.
    ObjectStorage() : data() {}

    ObjectStorage(const ObjectStorage &other) { new (&data) T(other.stored_object()); }

    ObjectStorage(ObjectStorage &&other) { new (&data) T(std::move(other.stored_object())); }

    ~ObjectStorage() { destruct_on_exit<T>(); }

    // Placement-constructs a T in the storage, forwarding `args` to T's constructor.
    template <typename... Args>
    void construct(Args &&...args) {
        new (&data) T(std::forward<Args>(args)...);
    }

    // Runs T's destructor on the stored object. Only callable with the default
    // template argument when Destruct is false.
    template <bool AllowManualDestruction = !Destruct>
    typename std::enable_if<AllowManualDestruction>::type destruct() {
        stored_object().~T();
    }

private:
    // If this is a constructor benchmark, destruct the underlying object
    template <typename U>
    void destruct_on_exit(typename std::enable_if<Destruct, U>::type * = 0) {
        destruct<true>();
    }
    // Otherwise, don't
    template <typename U>
    void destruct_on_exit(typename std::enable_if<!Destruct, U>::type * = 0) {}

    T &stored_object() { return *static_cast<T *>(static_cast<void *>(&data)); }

    // The casts must keep the const qualifier: `&data` is a `const TStorage *`
    // here, and static_cast is not allowed to cast constness away. Without it
    // the copy constructor does not compile once it is instantiated.
    T const &stored_object() const {
        return *static_cast<T const *>(static_cast<void const *>(&data));
    }

    TStorage data;
};
}  // namespace Detail

// ObjectStorage variant that destroys its stored object in its own destructor
// (Destruct == true).
template <typename T>
using storage_for = Detail::ObjectStorage<T, true>;

// ObjectStorage variant that never destroys the stored object by itself; the
// user calls destruct() explicitly (Destruct == false).
template <typename T>
using destructable_object = Detail::ObjectStorage<T, false>;
}  // namespace Benchmark
}  // namespace Catch

// end catch_constructor.hpp
// end catch_benchmarking_all.hpp
#endif

#endif  // ! CATCH_CONFIG_IMPL_ONLY

#ifdef CATCH_IMPL
// start catch_impl.hpp

#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wweak-vtables"
#endif

// Keep these here for external reporters
// start catch_test_case_tracker.h

#include <memory>
#include <string>
#include <vector>

namespace Catch {
namespace TestCaseTracking {

// Pairs a name with the source location it was declared at.
struct NameAndLocation {
    std::string name;
    SourceLineInfo location;

    NameAndLocation(std::string const &_name, SourceLineInfo const &_location);

    // Two values are equal when both the name and the location compare equal.
    friend bool operator==(NameAndLocation const &lhs, NameAndLocation const &rhs) {
        if (!(lhs.name == rhs.name)) {
            return false;
        }
        return lhs.location == rhs.location;
    }
};

class ITracker;

using ITrackerPtr = std::shared_ptr<ITracker>;

// Abstract interface of a node in the tracker hierarchy. The interface itself
// only stores the NameAndLocation identifying the node; every state query and
// action is pure virtual.
class ITracker {
    NameAndLocation m_nameAndLocation;

public:
    ITracker(NameAndLocation const &nameAndLoc) : m_nameAndLocation(nameAndLoc) {}

    // static queries
    NameAndLocation const &nameAndLocation() const { return m_nameAndLocation; }

    // Declared here, defined out of line.
    virtual ~ITracker();

    // dynamic queries
    virtual bool isComplete() const = 0;  // Successfully completed or failed
    virtual bool isSuccessfullyCompleted() const = 0;
    virtual bool isOpen() const = 0;  // Started but not complete
    virtual bool hasChildren() const = 0;
    virtual bool hasStarted() const = 0;

    virtual ITracker &parent() = 0;

    // actions
    virtual void close() = 0;  // Successfully complete
    virtual void fail() = 0;
    virtual void markAsNeedingAnotherRun() = 0;

    // Child management: children are handled as shared ITrackerPtr handles and
    // looked up by their NameAndLocation.
    virtual void addChild(ITrackerPtr const &child) = 0;
    virtual ITrackerPtr findChild(NameAndLocation const &nameAndLocation) = 0;
    virtual void openChild() = 0;

    // Debug/ checking
    virtual bool isSectionTracker() const = 0;
    virtual bool isGeneratorTracker() const = 0;
};

// Shared state for a set of trackers: a root tracker handle, a pointer to the
// tracker currently selected, and a three-valued run state.
class TrackerContext {
    enum RunState { NotStarted, Executing, CompletedCycle };

    ITrackerPtr m_rootTracker;
    ITracker *m_currentTracker = nullptr;  // raw pointer, null until set
    RunState m_runState = NotStarted;

public:
    // Run-level entry/exit points; startRun() hands back a tracker reference.
    ITracker &startRun();
    void endRun();

    // Cycle-level entry/exit points.
    void startCycle();
    void completeCycle();

    bool completedCycle() const;
    ITracker &currentTracker();
    void setCurrentTracker(ITracker *tracker);
};

// Common ITracker implementation: keeps the owning context, a raw pointer to
// the parent tracker, the list of children and a per-tracker cycle state.
// All members except hasStarted() are defined out of line.
class TrackerBase : public ITracker {
protected:
    enum CycleState {
        NotStarted,
        Executing,
        ExecutingChildren,
        NeedsAnotherRun,
        CompletedSuccessfully,
        Failed
    };

    using Children = std::vector<ITrackerPtr>;
    TrackerContext &m_ctx;
    ITracker *m_parent;
    Children m_children;
    CycleState m_runState = NotStarted;

public:
    TrackerBase(NameAndLocation const &nameAndLocation, TrackerContext &ctx, ITracker *parent);

    bool isComplete() const override;
    bool isSuccessfullyCompleted() const override;
    bool isOpen() const override;
    bool hasChildren() const override;
    // A tracker counts as started as soon as it has left the NotStarted state.
    bool hasStarted() const override { return m_runState != NotStarted; }

    void addChild(ITrackerPtr const &child) override;

    ITrackerPtr findChild(NameAndLocation const &nameAndLocation) override;
    ITracker &parent() override;

    void openChild() override;

    bool isSectionTracker() const override;
    bool isGeneratorTracker() const override;

    // Not part of the ITracker interface (no `override`).
    void open();

    void close() override;
    void fail() override;
    void markAsNeedingAnotherRun() override;

private:
    // Helpers that presumably re-point the context's current tracker at the
    // parent / at this tracker -- TODO confirm against the definitions.
    void moveToParent();
    void moveToThis();
};

// TrackerBase specialisation for sections. On top of the base state it stores
// a list of filter strings and a trimmed copy of the section name.
class SectionTracker : public TrackerBase {
    std::vector<std::string> m_filters;
    std::string m_trimmed_name;

public:
    SectionTracker(NameAndLocation const &nameAndLocation, TrackerContext &ctx, ITracker *parent);

    bool isSectionTracker() const override;

    bool isComplete() const override;

    // Static accessor returning a SectionTracker for `nameAndLocation` within
    // `ctx`; whether it creates or looks up the tracker is decided in the
    // out-of-line definition.
    static SectionTracker &acquire(TrackerContext &ctx, NameAndLocation const &nameAndLocation);

    void tryOpen();

    void addInitialFilters(std::vector<std::string> const &filters);
    void addNextFilters(std::vector<std::string> const &filters);
    //! Returns filters active in this tracker
    std::vector<std::string> const &getFilters() const;
    //! Returns whitespace-trimmed name of the tracked section
    std::string const &trimmedName() const;
};

}  // namespace TestCaseTracking

using TestCaseTracking::ITracker;
using TestCaseTracking::SectionTracker;
using TestCaseTracking::TrackerContext;

}  // namespace Catch

// end catch_test_case_tracker.h

// start catch_leak_detector.h

namespace Catch {

// Stateless helper whose work happens entirely in its constructor and
// destructor, both defined out of line.
struct LeakDetector {
    LeakDetector();
    ~LeakDetector();
};

}  // namespace Catch
// end catch_leak_detector.h
// Cpp files will be included in the single-header file here
// start catch_stats.cpp

// Statistical analysis tools

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)

#include <cassert>
#include <random>

#if defined(CATCH_CONFIG_USE_ASYNC)
#include <future>
#endif

namespace {
// Approximates the inverse error function of `x`.
//
// The value is computed as p(w) * x, where w is derived from
// -log((1 - x) * (1 + x)) and p is one of three fixed polynomials chosen by
// the size of w.
//
// The end points x == 1 and x == -1 are answered directly with +infinity and
// -infinity: there the log term is +infinity and evaluating the polynomial
// would collapse to -infinity regardless of the sign of x, i.e. the result
// would carry the wrong sign. For |x| > 1 the log argument is negative and
// the result is NaN, as before.
double erf_inv(double x) {
    // Code accompanying the article "Approximating the erfinv function" in GPU
    // Computing Gems, Volume 2
    double w, p;

    // Exact end points; HUGE_VAL comes from <cmath>, which log/sqrt below
    // already require.
    if (x == 1.0 || x == -1.0) {
        return x > 0 ? HUGE_VAL : -HUGE_VAL;
    }

    w = -log((1.0 - x) * (1.0 + x));

    if (w < 6.250000) {
        w = w - 3.125000;
        p = -3.6444120640178196996e-21;
        p = -1.685059138182016589e-19 + p * w;
        p = 1.2858480715256400167e-18 + p * w;
        p = 1.115787767802518096e-17 + p * w;
        p = -1.333171662854620906e-16 + p * w;
        p = 2.0972767875968561637e-17 + p * w;
        p = 6.6376381343583238325e-15 + p * w;
        p = -4.0545662729752068639e-14 + p * w;
        p = -8.1519341976054721522e-14 + p * w;
        p = 2.6335093153082322977e-12 + p * w;
        p = -1.2975133253453532498e-11 + p * w;
        p = -5.4154120542946279317e-11 + p * w;
        p = 1.051212273321532285e-09 + p * w;
        p = -4.1126339803469836976e-09 + p * w;
        p = -2.9070369957882005086e-08 + p * w;
        p = 4.2347877827932403518e-07 + p * w;
        p = -1.3654692000834678645e-06 + p * w;
        p = -1.3882523362786468719e-05 + p * w;
        p = 0.0001867342080340571352 + p * w;
        p = -0.00074070253416626697512 + p * w;
        p = -0.0060336708714301490533 + p * w;
        p = 0.24015818242558961693 + p * w;
        p = 1.6536545626831027356 + p * w;
    } else if (w < 16.000000) {
        w = sqrt(w) - 3.250000;
        p = 2.2137376921775787049e-09;
        p = 9.0756561938885390979e-08 + p * w;
        p = -2.7517406297064545428e-07 + p * w;
        p = 1.8239629214389227755e-08 + p * w;
        p = 1.5027403968909827627e-06 + p * w;
        p = -4.013867526981545969e-06 + p * w;
        p = 2.9234449089955446044e-06 + p * w;
        p = 1.2475304481671778723e-05 + p * w;
        p = -4.7318229009055733981e-05 + p * w;
        p = 6.8284851459573175448e-05 + p * w;
        p = 2.4031110387097893999e-05 + p * w;
        p = -0.0003550375203628474796 + p * w;
        p = 0.00095328937973738049703 + p * w;
        p = -0.0016882755560235047313 + p * w;
        p = 0.0024914420961078508066 + p * w;
        p = -0.0037512085075692412107 + p * w;
        p = 0.005370914553590063617 + p * w;
        p = 1.0052589676941592334 + p * w;
        p = 3.0838856104922207635 + p * w;
    } else {
        w = sqrt(w) - 5.000000;
        p = -2.7109920616438573243e-11;
        p = -2.5556418169965252055e-10 + p * w;
        p = 1.5076572693500548083e-09 + p * w;
        p = -3.7894654401267369937e-09 + p * w;
        p = 7.6157012080783393804e-09 + p * w;
        p = -1.4960026627149240478e-08 + p * w;
        p = 2.9147953450901080826e-08 + p * w;
        p = -6.7711997758452339498e-08 + p * w;
        p = 2.2900482228026654717e-07 + p * w;
        p = -9.9298272942317002539e-07 + p * w;
        p = 4.5260625972231537039e-06 + p * w;
        p = -1.9681778105531670567e-05 + p * w;
        p = 7.5995277030017761139e-05 + p * w;
        p = -0.00021503011930044477347 + p * w;
        p = -0.00013871931833623122026 + p * w;
        p = 1.0103004648645343977 + p * w;
        p = 4.8499064014085844221 + p * w;
    }
    return p * x;
}

double standard_deviation(std::vector<double>::iterator first, std::vector<double>::iterator last) {
    auto m = Catch::Benchmark::Detail::mean(first, last);
    double variance = std::accumulate(first, last, 0.,
                                      [m](double a, double b) {
                                          double diff = b - m;
                                          return a + diff * diff;
                                      }) /
                      (last - first);
    return std::sqrt(variance);
}

}  // namespace

namespace Catch {
namespace Benchmark {
namespace Detail {

// Returns the k/q quantile of [first, last), linearly interpolating between
// the two neighbouring order statistics when the target position
// (count - 1) * k / q is not a whole number.
// The range is partially reordered in place by std::nth_element.
double weighted_average_quantile(int k,
                                 int q,
                                 std::vector<double>::iterator first,
                                 std::vector<double>::iterator last) {
    auto length = last - first;
    double position = (length - 1) * k / static_cast<double>(q);
    int lower = static_cast<int>(position);
    double fraction = position - lower;

    auto lowerIt = first + lower;
    std::nth_element(first, lowerIt, last);
    auto lowerValue = *lowerIt;

    if (fraction != 0) {
        // After nth_element everything past lowerIt is >= *lowerIt, so the
        // minimum of that tail is the next order statistic.
        auto upperValue = *std::min_element(first + (lower + 1), last);
        return lowerValue + fraction * (upperValue - lowerValue);
    }
    return lowerValue;
}

// Inverse complementary error function, expressed through erf_inv as
// erf_inv(1 - x).
double erfc_inv(double x) { return erf_inv(1.0 - x); }

// Quantile of the standard normal distribution (mean 0, standard deviation 1)
// at probability `p`, computed as -erfc_inv(2p) * sqrt(2).
// `p` is asserted to lie in [0, 1]; when assertions are compiled out an
// out-of-range `p` yields 0.
double normal_quantile(double p) {
    static const double ROOT_TWO = std::sqrt(2.0);

    assert(p >= 0 && p <= 1);
    if (p < 0 || p > 1) {
        return 0.0;
    }

    // Scaling by sd * sqrt(2) with sd == 1, and adding a mean of 0, leaves
    // just the sqrt(2) factor.
    double const unscaled = -erfc_inv(2.0 * p);
    return unscaled * ROOT_TWO;
}

// Computes the outlier-variance figure from the point estimates of `mean` and
// `stddev` for `n` samples. The result is the smaller of two var_out(...)
// values divided by the squared stddev point estimate.
double outlier_variance(Estimate<double> mean, Estimate<double> stddev, int n) {
    double const stddevPoint = stddev.point;
    double const meanPerN = mean.point / n;
    double const halfMeanPerN = meanPerN / 2.;
    double const sgBound = (std::min)(halfMeanPerN / 4., stddevPoint / std::sqrt(n));
    double const sgSquared = sgBound * sgBound;
    double const stddevSquared = stddevPoint * stddevPoint;

    // The quotient is truncated to int before being returned as double.
    auto c_max = [n, meanPerN, stddevSquared, sgSquared](double x) -> double {
        double const offset = meanPerN - x;
        double const offsetSquared = offset * offset;
        double const scaledOffset = n * offsetSquared;
        double const k0 = -n * scaledOffset;
        double const k1 = stddevSquared - n * sgSquared + scaledOffset;
        double const discriminant = k1 * k1 - 4 * sgSquared * k0;
        return static_cast<int>(-2. * k0 / (k1 + std::sqrt(discriminant)));
    };

    auto var_out = [n, stddevSquared, sgSquared](double c) {
        double const remainder = n - c;
        return (remainder / n) * (stddevSquared - remainder * sgSquared);
    };

    double const smallestCMax = (std::min)(c_max(0.), c_max(halfMeanPerN));
    double const smallestVarOut = (std::min)(var_out(1), var_out(smallestCMax));
    return smallestVarOut / stddevSquared;
}

// Bootstraps estimates for the mean and the standard deviation of
// [first, last) and derives the outlier variance from them.
//
// For each of the two statistics a seed is drawn from a function-local static
// std::random_device, a std::mt19937 is seeded with it, the samples are
// resampled `n_resamples` times and the result is passed to bootstrap()
// together with `confidence_level`. With CATCH_CONFIG_USE_ASYNC the two
// estimates are computed through std::async (std::launch::async); otherwise
// they are computed one after the other.
bootstrap_analysis analyse_samples(double confidence_level,
                                   int n_resamples,
                                   std::vector<double>::iterator first,
                                   std::vector<double>::iterator last) {
    CATCH_INTERNAL_START_WARNINGS_SUPPRESSION
    CATCH_INTERNAL_SUPPRESS_GLOBALS_WARNINGS
    static std::random_device entropy;
    CATCH_INTERNAL_STOP_WARNINGS_SUPPRESSION

    auto n = static_cast<int>(
            last - first);  // seriously, one can't use integral types without hell in C++

    // Plain function pointers, so both statistics can share one Estimate lambda.
    auto mean = &Detail::mean<std::vector<double>::iterator>;
    auto stddev = &standard_deviation;

#if defined(CATCH_CONFIG_USE_ASYNC)
    auto Estimate = [=](double (*f)(std::vector<double>::iterator, std::vector<double>::iterator)) {
        // The seed is drawn before the task is launched, i.e. on the calling thread.
        auto seed = entropy();
        return std::async(std::launch::async, [=] {
            std::mt19937 rng(seed);
            auto resampled = resample(rng, n_resamples, first, last, f);
            return bootstrap(confidence_level, first, last, resampled, f);
        });
    };

    // Launch both tasks before waiting on either of them.
    auto mean_future = Estimate(mean);
    auto stddev_future = Estimate(stddev);

    auto mean_estimate = mean_future.get();
    auto stddev_estimate = stddev_future.get();
#else
    auto Estimate = [=](double (*f)(std::vector<double>::iterator, std::vector<double>::iterator)) {
        auto seed = entropy();
        std::mt19937 rng(seed);
        auto resampled = resample(rng, n_resamples, first, last, f);
        return bootstrap(confidence_level, first, last, resampled, f);
    };

    auto mean_estimate = Estimate(mean);
    auto stddev_estimate = Estimate(stddev);
#endif  // CATCH_USE_ASYNC

    double outlier_variance = Detail::outlier_variance(mean_estimate, stddev_estimate, n);

    return {mean_estimate, stddev_estimate, outlier_variance};
}
}  // namespace Detail
}  // namespace Benchmark
}  // namespace Catch

#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING
// end catch_stats.cpp
// start catch_approx.cpp

#include <cmath>
#include <limits>

namespace {

// Performs equivalent check of std::fabs(lhs - rhs) <= margin
// But without the subtraction to allow for INFINITY in comparison
bool marginComparison(double lhs, double rhs, double margin) {
    // Each side, widened by the margin, must reach the other side. Both
    // checks are written positively so that a NaN operand compares as
    // "not within margin".
    bool const rhsReachable = lhs + margin >= rhs;
    bool const lhsReachable = rhs + margin >= lhs;
    return rhsReachable && lhsReachable;
}

}  // namespace

namespace Catch {
namespace Detail {

Approx::Approx(double value)
        : m_epsilon(std::numeric_limits<float>::epsilon() * 100),
          m_margin(0.0),
          m_scale(0.0),
          m_value(value) {}

Approx Approx::custom() { return Approx(0); }

Approx Approx::operator-() const {
    auto temp(*this);
    temp.m_value = -temp.m_value;
    return temp;
}

std::string Approx::toString() const {
    ReusableStringStream rss;
    rss << "Approx( " << ::Catch::Detail::stringify(m_value) << " )";
    return rss.str();
}

bool Approx::equalityComparisonImpl(const double other) const {
    // First try with fixed margin, then compute margin based on epsilon, scale
    // and Approx's value Thanks to Richard Harris for his help refining the
    // scaled margin value
    return marginComparison(m_value, other, m_margin) ||
           marginComparison(m_value, other,
                            m_epsilon * (m_scale + std::fabs(std::isinf(m_value) ? 0 : m_value)));
}

void Approx::setMargin(double newMargin) {
    CATCH_ENFORCE(newMargin >= 0,
                  "Invalid Approx::margin: " << newMargin << '.'
                                             << " Approx::Margin has to be non-negative.");
    m_margin = newMargin;
}

void Approx::setEpsilon(double newEpsilon) {
    CATCH_ENFORCE(newEpsilon >= 0 && newEpsilon <= 1.0,
                  "Invalid Approx::epsilon: " << newEpsilon << '.'
                                              << " Approx::epsilon has to be in [0, 1]");
    m_epsilon = newEpsilon;
}

}  // end namespace Detail

namespace literals {
// User-defined literals building an Approx from a floating-point or an
// integer literal, e.g. `1.5_a` or `3_a`.
// Spelled without whitespace between `""` and the suffix: the spaced form
// `operator"" _a` is deprecated and newer compilers warn about it. Both
// spellings name the same function, so existing declarations still match.
Detail::Approx operator""_a(long double val) { return Detail::Approx(val); }
Detail::Approx operator""_a(unsigned long long val) { return Detail::Approx(val); }
}  // end namespace literals

// Stringification of an Approx simply forwards to Approx::toString().
std::string StringMaker<Catch::Detail::Approx>::convert(Catch::Detail::Approx const &value) {
    return value.toString();
}

}  // end namespace Catch
// end catch_approx.cpp
// start catch_assertionhandler.cpp

// start catch_debugger.h

namespace Catch {
// Queried by CATCH_BREAK_INTO_DEBUGGER before it executes CATCH_TRAP().
// Defined elsewhere.
bool isDebuggerActive();
}

// CATCH_TRAP() is the platform-specific statement used to stop in the
// debugger. It is deliberately left undefined on platform/architecture
// combinations not listed below; CATCH_BREAK_INTO_DEBUGGER checks for that.
#ifdef CATCH_PLATFORM_MAC

#if defined(__i386__) || defined(__x86_64__)
#define CATCH_TRAP() __asm__("int $3\n" : :) /* NOLINT */
#elif defined(__aarch64__)
#define CATCH_TRAP() __asm__(".inst 0xd4200000")
#endif

#elif defined(CATCH_PLATFORM_IPHONE)

// use inline assembler
#if defined(__i386__) || defined(__x86_64__)
#define CATCH_TRAP() __asm__("int $3")
#elif defined(__aarch64__)
#define CATCH_TRAP() __asm__(".inst 0xd4200000")
#elif defined(__arm__) && !defined(__thumb__)
#define CATCH_TRAP() __asm__(".inst 0xe7f001f0")
#elif defined(__arm__) && defined(__thumb__)
#define CATCH_TRAP() __asm__(".inst 0xde01")
#endif

#elif defined(CATCH_PLATFORM_LINUX)
// If we can use inline assembler, do it because this allows us to break
// directly at the location of the failing check instead of breaking inside
// raise() called from it, i.e. one stack frame below.
#if defined(__GNUC__) && (defined(__i386) || defined(__x86_64))
#define CATCH_TRAP() asm volatile("int $3") /* NOLINT */
#else                                       // Fall back to the generic way.
#include <signal.h>

#define CATCH_TRAP() raise(SIGTRAP)
#endif
#elif defined(_MSC_VER)
// MSVC: compiler intrinsic.
#define CATCH_TRAP() __debugbreak()
#elif defined(__MINGW32__)
// MinGW: declare the DebugBreak import by hand and call it.
extern "C" __declspec(dllimport) void __stdcall DebugBreak();
#define CATCH_TRAP() DebugBreak()
#endif

// CATCH_BREAK_INTO_DEBUGGER() can be supplied by the user; it is only defined
// here when it is not defined already. The default is an immediately invoked
// lambda, so the macro is usable as a single expression statement.
#ifndef CATCH_BREAK_INTO_DEBUGGER
#ifdef CATCH_TRAP
// Trap only when Catch::isDebuggerActive() reports true.
#define CATCH_BREAK_INTO_DEBUGGER()      \
    [] {                                 \
        if (Catch::isDebuggerActive()) { \
            CATCH_TRAP();                \
        }                                \
    }()
#else
// No trap available on this platform: expand to a no-op lambda call.
#define CATCH_BREAK_INTO_DEBUGGER() [] {}()
#endif
#endif

// end catch_debugger.h
// start catch_run_context.h

// start catch_fatal_condition.h

#include <cassert>

namespace Catch {

// Wrapper for platform-specific fatal error (signals/SEH) handlers
//
// Tries to be cooperative with other handlers, and not step over
// other handlers. This means that unknown structured exceptions
// are passed on, previous signal handlers are called, and so on.
//
// Can only be instantiated once, and assumes that once a signal
// is caught, the binary will end up terminating.
class FatalConditionHandler {
    // Tracks whether engage() has been called without a matching disengage().
    bool m_started = false;

    // Install/disengage implementation for specific platform.
    // Should be if-defed to work on current platform, can assume
    // engage-disengage 1:1 pairing.
    void engage_platform();
    void disengage_platform();

public:
    // Should also have platform-specific implementations as needed
    FatalConditionHandler();
    ~FatalConditionHandler();

    // Installs the platform handler. Asserts that the handler is not already
    // installed.
    void engage() {
        assert(!m_started && "Handler cannot be installed twice.");
        m_started = true;
        engage_platform();
    }

    // Removes the platform handler. Asserts that engage() was called before.
    void disengage() {
        assert(m_started && "Handler cannot be uninstalled without being installed first");
        m_started = false;
        disengage_platform();
    }
};

//! Simple RAII guard for (dis)engaging the FatalConditionHandler
class FatalConditionHandlerGuard {
    // Handler being guarded; stored as a raw pointer and dereferenced without
    // a null check, so it must be non-null.
    FatalConditionHandler *m_handler;

public:
    // Engages `handler` on construction ...
    FatalConditionHandlerGuard(FatalConditionHandler *handler) : m_handler(handler) {
        m_handler->engage();
    }
    // ... and disengages it again on destruction.
    ~FatalConditionHandlerGuard() { m_handler->disengage(); }
};

}  // end namespace Catch

// end catch_fatal_condition.h
#include <string>

namespace Catch {

struct IMutableContext;

///////////////////////////////////////////////////////////////////////////

// Implements both IResultCapture and IRunner. It is constructed from a config
// and a streaming reporter, is non-copyable, and keeps the per-run state
// listed in the private section below (totals, messages, tracker context,
// fatal-condition handler, ...).
class RunContext : public IResultCapture, public IRunner {
public:
    RunContext(RunContext const &) = delete;
    RunContext &operator=(RunContext const &) = delete;

    // Takes ownership of `reporter` (passed as an rvalue).
    explicit RunContext(IConfigPtr const &_config, IStreamingReporterPtr &&reporter);

    ~RunContext() override;

    void testGroupStarting(std::string const &testSpec,
                           std::size_t groupIndex,
                           std::size_t groupsCount);
    void testGroupEnded(std::string const &testSpec,
                        Totals const &totals,
                        std::size_t groupIndex,
                        std::size_t groupsCount);

    // Runs a single test case and returns its Totals.
    Totals runTest(TestCase const &testCase);

    IConfigPtr config() const;
    IStreamingReporter &reporter() const;

public:  // IResultCapture
    // Assertion handlers
    void handleExpr(AssertionInfo const &info,
                    ITransientExpression const &expr,
                    AssertionReaction &reaction) override;
    void handleMessage(AssertionInfo const &info,
                       ResultWas::OfType resultType,
                       StringRef const &message,
                       AssertionReaction &reaction) override;
    void handleUnexpectedExceptionNotThrown(AssertionInfo const &info,
                                            AssertionReaction &reaction) override;
    void handleUnexpectedInflightException(AssertionInfo const &info,
                                           std::string const &message,
                                           AssertionReaction &reaction) override;
    void handleIncomplete(AssertionInfo const &info) override;
    void handleNonExpr(AssertionInfo const &info,
                       ResultWas::OfType resultType,
                       AssertionReaction &reaction) override;

    // Section lifecycle notifications.
    bool sectionStarted(SectionInfo const &sectionInfo, Counts &assertions) override;

    void sectionEnded(SectionEndInfo const &endInfo) override;
    void sectionEndedEarly(SectionEndInfo const &endInfo) override;

    auto acquireGeneratorTracker(StringRef generatorName, SourceLineInfo const &lineInfo)
            -> IGeneratorTracker & override;

    // Benchmark notifications exist only when benchmarking support is compiled in.
#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
    void benchmarkPreparing(std::string const &name) override;
    void benchmarkStarting(BenchmarkInfo const &info) override;
    void benchmarkEnded(BenchmarkStats<> const &stats) override;
    void benchmarkFailed(std::string const &error) override;
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

    void pushScopedMessage(MessageInfo const &message) override;
    void popScopedMessage(MessageInfo const &message) override;

    void emplaceUnscopedMessage(MessageBuilder const &builder) override;

    std::string getCurrentTestName() const override;

    const AssertionResult *getLastResult() const override;

    void exceptionEarlyReported() override;

    void handleFatalErrorCondition(StringRef message) override;

    bool lastAssertionPassed() override;

    void assertionPassed() override;

public:
    // !TBD We need to do this another way!
    bool aborting() const final;

private:
    // The two string parameters are out-parameters, presumably receiving the
    // output captured while the test ran -- TODO confirm against the definition.
    void runCurrentTest(std::string &redirectedCout, std::string &redirectedCerr);
    void invokeActiveTestCase();

    void resetAssertionInfo();
    bool testForMissingAssertions(Counts &assertions);

    void assertionEnded(AssertionResult const &result);
    void reportExpr(AssertionInfo const &info,
                    ResultWas::OfType resultType,
                    ITransientExpression const *expr,
                    bool negated);

    void populateReaction(AssertionReaction &reaction);

private:
    void handleUnfinishedSections();

    TestRunInfo m_runInfo;
    IMutableContext &m_context;
    TestCase const *m_activeTestCase = nullptr;  // null by default
    ITracker *m_testCaseTracker = nullptr;       // null by default
    Option<AssertionResult> m_lastResult;

    IConfigPtr m_config;
    Totals m_totals;
    IStreamingReporterPtr m_reporter;
    std::vector<MessageInfo> m_messages;
    std::vector<ScopedMessage> m_messageScopes; /* Keeps owners of so-called unscoped messages. */
    AssertionInfo m_lastAssertionInfo;
    std::vector<SectionEndInfo> m_unfinishedSections;
    std::vector<ITracker *> m_activeSections;
    TrackerContext m_trackerContext;
    FatalConditionHandler m_fatalConditionhandler;
    bool m_lastAssertionPassed = false;
    bool m_shouldReportUnexpected = true;
    // No default member initializer, unlike the two flags above.
    bool m_includeSuccessfulResults;
};

void seedRng(IConfig const &config);
unsigned int rngSeed();
}  // end namespace Catch

// end catch_run_context.h
namespace Catch {

namespace {
// File-local stream operator: writes the expression by delegating to its
// streamReconstructedExpression() member.
auto operator<<(std::ostream &os, ITransientExpression const &expr) -> std::ostream & {
    expr.streamReconstructedExpression(os);
    return os;
}
}  // namespace

// Records only whether the expression is negated.
LazyExpression::LazyExpression(bool isNegated) : m_isNegated(isNegated) {}

// Copies the negation flag; the transient expression pointer is not part of
// this initialiser list.
LazyExpression::LazyExpression(LazyExpression const &other) : m_isNegated(other.m_isNegated) {}

// True when a transient expression is attached.
LazyExpression::operator bool() const { return m_transientExpression != nullptr; }

// Streams the expression, prefixed with "!" when negated. A negated binary
// expression is additionally wrapped in parentheses. Without an attached
// expression an error marker is written instead.
auto operator<<(std::ostream &os, LazyExpression const &lazyExpr) -> std::ostream & {
    if (lazyExpr.m_isNegated) {
        os << "!";
    }

    if (!lazyExpr) {
        os << "{** error - unchecked empty expression requested **}";
        return os;
    }

    auto const &expression = *lazyExpr.m_transientExpression;
    bool const parenthesise = lazyExpr.m_isNegated && expression.isBinaryExpression();
    if (parenthesise) {
        os << "(";
    }
    os << expression;
    if (parenthesise) {
        os << ")";
    }
    return os;
}

// Bundles the macro name, source location, captured expression text and
// result disposition into m_assertionInfo and binds the handler to the
// current result capture.
AssertionHandler::AssertionHandler(StringRef const &macroName,
                                   SourceLineInfo const &lineInfo,
                                   StringRef capturedExpression,
                                   ResultDisposition::Flags resultDisposition)
        : m_assertionInfo{macroName, lineInfo, capturedExpression, resultDisposition},
          m_resultCapture(getResultCapture()) {}

// The handle* members below forward to the result capture, always passing the
// stored assertion info and the reaction object it may update.
void AssertionHandler::handleExpr(ITransientExpression const &expr) {
    m_resultCapture.handleExpr(m_assertionInfo, expr, m_reaction);
}
void AssertionHandler::handleMessage(ResultWas::OfType resultType, StringRef const &message) {
    m_resultCapture.handleMessage(m_assertionInfo, resultType, message, m_reaction);
}

// Reads the allowThrows setting from the current context's config.
auto AssertionHandler::allowThrows() const -> bool {
    return getCurrentContext().getConfig()->allowThrows();
}

// Marks the assertion as completed and then acts on the recorded reaction:
// first an optional debugger break, then an optional abort of the test.
void AssertionHandler::complete() {
    setCompleted();
    if (m_reaction.shouldDebugBreak) {
        // If you find your debugger stopping you here then go one level up on the
        // call-stack for the code that caused it (typically a failed assertion)

        // (To go back to the test and change execution, jump over the throw, next)
        CATCH_BREAK_INTO_DEBUGGER();
    }
    if (m_reaction.shouldThrow) {
        // With exceptions enabled the test is aborted by throwing; otherwise
        // CATCH_ERROR is invoked instead.
#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
        throw Catch::TestFailureException();
#else
        CATCH_ERROR("Test failure requires aborting test!");
#endif
    }
}
void AssertionHandler::setCompleted() { m_completed = true; }

// Reports the currently active exception, translated to a message string.
void AssertionHandler::handleUnexpectedInflightException() {
    m_resultCapture.handleUnexpectedInflightException(
            m_assertionInfo, Catch::translateActiveException(), m_reaction);
}

// Both "exception thrown as expected" and "exception not thrown as expected"
// are reported as ResultWas::Ok.
void AssertionHandler::handleExceptionThrownAsExpected() {
    m_resultCapture.handleNonExpr(m_assertionInfo, ResultWas::Ok, m_reaction);
}
void AssertionHandler::handleExceptionNotThrownAsExpected() {
    m_resultCapture.handleNonExpr(m_assertionInfo, ResultWas::Ok, m_reaction);
}

void AssertionHandler::handleUnexpectedExceptionNotThrown() {
    m_resultCapture.handleUnexpectedExceptionNotThrown(m_assertionInfo, m_reaction);
}

// A skipped throwing call is likewise reported as ResultWas::Ok.
void AssertionHandler::handleThrowingCallSkipped() {
    m_resultCapture.handleNonExpr(m_assertionInfo, ResultWas::Ok, m_reaction);
}

// This is the overload that takes a string and infers the Equals matcher from
// it. The more general overload, which takes any string matcher, is in
// catch_capture_matchers.cpp.
void handleExceptionMatchExpr(AssertionHandler &handler,
                              std::string const &str,
                              StringRef const &matcherString) {
    handleExceptionMatchExpr(handler, Matchers::Equals(str), matcherString);
}

}  // namespace Catch
// end catch_assertionhandler.cpp
// start catch_assertionresult.cpp

namespace Catch {
AssertionResultData::AssertionResultData(ResultWas::OfType _resultType,
                                         LazyExpression const &_lazyExpression)
        : lazyExpression(_lazyExpression), resultType(_resultType) {}

std::string AssertionResultData::reconstructExpression() const {
    if (reconstructedExpression.empty()) {
        if (lazyExpression) {
            ReusableStringStream rss;
            rss << lazyExpression;
            reconstructedExpression = rss.str();
        }
    }
    return reconstructedExpression;
}

// Stores copies of the assertion info and the result data.
AssertionResult::AssertionResult(AssertionInfo const &info, AssertionResultData const &data)
        : m_info(info), m_resultData(data) {}

// Result was a success
bool AssertionResult::succeeded() const { return Catch::isOk(m_resultData.resultType); }

// Result was a success, or failure is suppressed
bool AssertionResult::isOk() const {
    return Catch::isOk(m_resultData.resultType) || shouldSuppressFailure(m_info.resultDisposition);
}

ResultWas::OfType AssertionResult::getResultType() const { return m_resultData.resultType; }

// True when the captured expression text is non-empty.
bool AssertionResult::hasExpression() const { return !m_info.capturedExpression.empty(); }

// True when the result data carries a non-empty message.
bool AssertionResult::hasMessage() const { return !m_resultData.message.empty(); }

// Returns the captured expression text; for a false-test disposition the text
// is wrapped as "!(" ... ")".
std::string AssertionResult::getExpression() const {
    bool const wrapInNegation = isFalseTest(m_info.resultDisposition);

    std::string text;
    // Room for the optional "!(" and ")"; over-reserving by 3 is basically free.
    text.reserve(m_info.capturedExpression.size() + 3);

    if (wrapInNegation) {
        text += "!(";
    }
    text += m_info.capturedExpression;
    if (wrapInNegation) {
        text += ')';
    }
    return text;
}

// Returns the captured expression as it appeared in the assertion macro,
// i.e. "MACRO( expression )", or just the expression when no macro name was
// recorded.
std::string AssertionResult::getExpressionInMacro() const {
    if (m_info.macroName.empty()) {
        return static_cast<std::string>(m_info.capturedExpression);
    }

    std::string text;
    // "( " and " )" add four characters around the expression.
    text.reserve(m_info.macroName.size() + m_info.capturedExpression.size() + 4);
    text += m_info.macroName;
    text += "( ";
    text += m_info.capturedExpression;
    text += " )";
    return text;
}

// True when there is an expression and its expanded form differs from the
// text that was captured.
bool AssertionResult::hasExpandedExpression() const {
    if (!hasExpression()) {
        return false;
    }
    return getExpandedExpression() != getExpression();
}

// Returns the reconstructed expression, falling back to getExpression() when
// the reconstruction is empty.
std::string AssertionResult::getExpandedExpression() const {
    std::string reconstructed = m_resultData.reconstructExpression();
    if (reconstructed.empty()) {
        return getExpression();
    }
    return reconstructed;
}

// Plain accessors; each returns a copy of the stored value.
std::string AssertionResult::getMessage() const { return m_resultData.message; }
SourceLineInfo AssertionResult::getSourceInfo() const { return m_info.lineInfo; }

StringRef AssertionResult::getTestMacroName() const { return m_info.macroName; }

}  // end namespace Catch
// end catch_assertionresult.cpp
// start catch_capture_matchers.cpp

namespace Catch {

using StringMatcher = Matchers::Impl::MatcherBase<std::string>;

// This is the general overload that takes a any string matcher
// There is another overload, in catch_assertionhandler.h/.cpp, that only takes
// a string and infers the Equals matcher (so the header does not mention
// matchers)
// Translates the currently active exception into a string and hands a match
// expression over that string and `matcher` to the assertion handler.
void handleExceptionMatchExpr(AssertionHandler &handler,
                              StringMatcher const &matcher,
                              StringRef const &matcherString) {
    std::string translated = Catch::translateActiveException();
    MatchExpr<std::string, StringMatcher const &> matchExpr(translated, matcher, matcherString);
    handler.handleExpr(matchExpr);
}

}  // namespace Catch
// end catch_capture_matchers.cpp
// start catch_commandline.cpp

// start catch_commandline.h

// start catch_clara.h

// Use Catch's value for console width (store Clara's off to the side, if
// present)
#ifdef CLARA_CONFIG_CONSOLE_WIDTH
#define CATCH_TEMP_CLARA_CONFIG_CONSOLE_WIDTH CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH
#undef CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH
#endif
#define CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH CATCH_CONFIG_CONSOLE_WIDTH - 1

#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wweak-vtables"
#pragma clang diagnostic ignored "-Wexit-time-destructors"
#pragma clang diagnostic ignored "-Wshadow"
#endif

// start clara.hpp
// Copyright 2017 Two Blue Cubes Ltd. All rights reserved.
//
// Distributed under the Boost Software License, Version 1.0. (See accompanying
// file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
//
// See https://github.com/philsquared/Clara for more details

// Clara v1.1.5

#ifndef CATCH_CLARA_CONFIG_CONSOLE_WIDTH
#define CATCH_CLARA_CONFIG_CONSOLE_WIDTH 80
#endif

#ifndef CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH
#define CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH CATCH_CLARA_CONFIG_CONSOLE_WIDTH
#endif

#ifndef CLARA_CONFIG_OPTIONAL_TYPE
#ifdef __has_include
#if __has_include(<optional>) && __cplusplus >= 201703L
#include <optional>
#define CLARA_CONFIG_OPTIONAL_TYPE std::optional
#endif
#endif
#endif

// ----------- #included from clara_textflow.hpp -----------

// TextFlowCpp
//
// A single-header library for wrapping and laying out basic text, by Phil Nash
//
// Distributed under the Boost Software License, Version 1.0. (See accompanying
// file LICENSE.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
//
// This project is hosted at https://github.com/philsquared/textflowcpp

#include <cassert>
#include <ostream>
#include <sstream>
#include <vector>

#ifndef CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH
#define CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH 80
#endif

namespace Catch {
namespace clara {
namespace TextFlow {

// Reports whether `c` is a space, tab, line feed or carriage return.
inline bool isWhitespace(char c) {
    switch (c) {
        case ' ':
        case '\t':
        case '\n':
        case '\r':
            return true;
        default:
            return false;
    }
}
// Reports whether a line may be broken immediately before `c`
// (opening brackets and the pipe character).
inline bool isBreakableBefore(char c) {
    switch (c) {
        case '[':
        case '(':
        case '{':
        case '<':
        case '|':
            return true;
        default:
            return false;
    }
}
// Reports whether a line may be broken immediately after `c`
// (closing brackets, punctuation, operators and path separators).
inline bool isBreakableAfter(char c) {
    switch (c) {
        case ']':
        case ')':
        case '}':
        case '>':
        case '.':
        case ',':
        case ':':
        case ';':
        case '*':
        case '+':
        case '-':
        case '=':
        case '&':
        case '/':
        case '\\':
            return true;
        default:
            return false;
    }
}

class Columns;

// A block of text that is wrapped to a fixed width when iterated or streamed.
// Iterating a Column yields one already-indented output line per step.
class Column {
    std::vector<std::string> m_strings;
    // Total width of a line, including the indent.
    size_t m_width = CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH;
    // Indent applied to every line, except the first when m_initialIndent is set.
    size_t m_indent = 0;
    // Indent for the very first line only; npos means "use m_indent".
    size_t m_initialIndent = std::string::npos;

public:
    // Forward iterator over the wrapped lines of a Column.
    class iterator {
        friend Column;

        Column const &m_column;
        // Index of the string in m_column.m_strings currently being wrapped.
        size_t m_stringIndex = 0;
        // Offset within the current string where the current line starts.
        size_t m_pos = 0;

        // Number of characters of the current string that form the current line.
        size_t m_len = 0;
        // Offset of the next '\n' (or end of string) at or after m_pos.
        size_t m_end = 0;
        // Set when no break point was found and the line is cut mid-word;
        // a "-" is then appended to the emitted line.
        bool m_suffix = false;

        // Private constructor used by Column::end(): positions the iterator at
        // the given string index without computing a line.
        iterator(Column const &column, size_t stringIndex)
                : m_column(column), m_stringIndex(stringIndex) {}

        // The string currently being wrapped.
        auto line() const -> std::string const & { return m_column.m_strings[m_stringIndex]; }

        // True when the current string may be broken at offset `at`: at the
        // end of the string, at the start of a whitespace run, before a
        // "breakable before" character, or after a "breakable after" character.
        auto isBoundary(size_t at) const -> bool {
            assert(at > 0);
            assert(at <= line().size());

            return at == line().size() ||
                   (isWhitespace(line()[at]) && !isWhitespace(line()[at - 1])) ||
                   isBreakableBefore(line()[at]) || isBreakableAfter(line()[at - 1]);
        }

        // Computes m_len, m_end and m_suffix for the line starting at m_pos.
        void calcLength() {
            assert(m_stringIndex < m_column.m_strings.size());

            m_suffix = false;
            // Usable text width once the indent for this line is subtracted.
            auto width = m_column.m_width - indent();
            m_end = m_pos;
            // A newline sitting exactly at m_pos is stepped over before
            // scanning for the next one.
            if (line()[m_pos] == '\n') {
                ++m_end;
            }
            while (m_end < line().size() && line()[m_end] != '\n')
                ++m_end;

            if (m_end < m_pos + width) {
                // Everything up to the newline / end of string fits.
                m_len = m_end - m_pos;
            } else {
                // Walk back from the full width to the nearest break point,
                // then drop any whitespace left at the end of the line.
                size_t len = width;
                while (len > 0 && !isBoundary(m_pos + len))
                    --len;
                while (len > 0 && isWhitespace(line()[m_pos + len - 1]))
                    --len;

                if (len > 0) {
                    m_len = len;
                } else {
                    // No break point: cut the text one short of the width so
                    // the "-" suffix still fits.
                    m_suffix = true;
                    m_len = width - 1;
                }
            }
        }

        // Indent for the current line: the initial indent (if set) for the
        // first line of the first string, otherwise the regular indent.
        auto indent() const -> size_t {
            auto initial =
                    m_pos == 0 && m_stringIndex == 0 ? m_column.m_initialIndent : std::string::npos;
            return initial == std::string::npos ? m_column.m_indent : initial;
        }

        // Prefixes `plain` with the indent and appends "-" when m_suffix is set.
        auto addIndentAndSuffix(std::string const &plain) const -> std::string {
            return std::string(indent(), ' ') + (m_suffix ? plain + "-" : plain);
        }

    public:
        using difference_type = std::ptrdiff_t;
        using value_type = std::string;
        using pointer = value_type *;
        using reference = value_type &;
        using iterator_category = std::forward_iterator_tag;

        // Begin iterator: positioned on the first line of the first string.
        explicit iterator(Column const &column) : m_column(column) {
            assert(m_column.m_width > m_column.m_indent);
            assert(m_column.m_initialIndent == std::string::npos ||
                   m_column.m_width > m_column.m_initialIndent);
            calcLength();
            if (m_len == 0)
                m_stringIndex++;  // Empty string
        }

        // Returns the current line with indent (and suffix, if any) applied.
        auto operator*() const -> std::string {
            assert(m_stringIndex < m_column.m_strings.size());
            assert(m_pos <= m_end);
            return addIndentAndSuffix(line().substr(m_pos, m_len));
        }

        // Advances to the next line, moving on to the next string when the
        // current one is exhausted.
        auto operator++() -> iterator & {
            m_pos += m_len;
            // Consume exactly one newline, or otherwise all whitespace that
            // follows the line just emitted.
            if (m_pos < line().size() && line()[m_pos] == '\n')
                m_pos += 1;
            else
                while (m_pos < line().size() && isWhitespace(line()[m_pos]))
                    ++m_pos;

            if (m_pos == line().size()) {
                m_pos = 0;
                ++m_stringIndex;
            }
            if (m_stringIndex < m_column.m_strings.size())
                calcLength();
            return *this;
        }
        auto operator++(int) -> iterator {
            iterator prev(*this);
            operator++();
            return prev;
        }

        // Iterators are equal when they refer to the same position in the
        // same Column object.
        auto operator==(iterator const &other) const -> bool {
            return m_pos == other.m_pos && m_stringIndex == other.m_stringIndex &&
                   &m_column == &other.m_column;
        }
        auto operator!=(iterator const &other) const -> bool { return !operator==(other); }
    };
    using const_iterator = iterator;

    // Creates a column holding `text` as its single string.
    explicit Column(std::string const &text) { m_strings.push_back(text); }

    // Fluent setters; each returns *this so calls can be chained.
    auto width(size_t newWidth) -> Column & {
        assert(newWidth > 0);
        m_width = newWidth;
        return *this;
    }
    auto indent(size_t newIndent) -> Column & {
        m_indent = newIndent;
        return *this;
    }
    auto initialIndent(size_t newIndent) -> Column & {
        m_initialIndent = newIndent;
        return *this;
    }

    auto width() const -> size_t { return m_width; }
    auto begin() const -> iterator { return iterator(*this); }
    auto end() const -> iterator { return {*this, m_strings.size()}; }

    // Streams the wrapped lines separated by "\n" (no trailing newline).
    inline friend std::ostream &operator<<(std::ostream &os, Column const &col) {
        bool first = true;
        for (auto line : col) {
            if (first)
                first = false;
            else
                os << "\n";
            os << line;
        }
        return os;
    }

    // Places this column and `other` side by side; defined after Columns.
    auto operator+(Column const &other) -> Columns;

    // Returns the same text that operator<< would write.
    auto toString() const -> std::string {
        std::ostringstream oss;
        oss << *this;
        return oss.str();
    }
};

// A Column with empty text whose only purpose is to occupy `spaceWidth`
// characters of width.
class Spacer : public Column {
public:
    explicit Spacer(size_t spaceWidth) : Column(std::string()) {
        width(spaceWidth);
    }
};

// A set of Column objects laid out side by side. Iterating yields one combined
// row per step, built from the current line of every column.
class Columns {
    std::vector<Column> m_columns;

public:
    // Forward iterator over the combined rows.
    class iterator {
        friend Columns;
        struct EndTag {};

        std::vector<Column> const &m_columns;
        std::vector<Column::iterator> m_iterators;
        size_t m_activeIterators;

        // Past-the-end iterator: every per-column iterator sits at its end().
        iterator(Columns const &columns, EndTag)
                : m_columns(columns.m_columns), m_activeIterators(0) {
            m_iterators.reserve(m_columns.size());

            for (auto const &column : m_columns)
                m_iterators.push_back(column.end());
        }

    public:
        using difference_type = std::ptrdiff_t;
        using value_type = std::string;
        using pointer = value_type *;
        using reference = value_type &;
        using iterator_category = std::forward_iterator_tag;

        // Begin iterator: every per-column iterator sits at its begin().
        explicit iterator(Columns const &columns)
                : m_columns(columns.m_columns), m_activeIterators(m_columns.size()) {
            m_iterators.reserve(m_columns.size());

            for (auto const &column : m_columns)
                m_iterators.push_back(column.begin());
        }

        bool operator==(iterator const &other) const { return m_iterators == other.m_iterators; }
        bool operator!=(iterator const &other) const { return m_iterators != other.m_iterators; }

        // Builds the current row. Padding is accumulated lazily so that
        // trailing exhausted columns do not add trailing spaces to the row.
        std::string operator*() const {
            std::string row;
            std::string padding;

            for (size_t i = 0; i < m_columns.size(); ++i) {
                size_t const width = m_columns[i].width();

                if (m_iterators[i] == m_columns[i].end()) {
                    // Exhausted column: only remember the gap it leaves.
                    padding += std::string(width, ' ');
                    continue;
                }

                std::string const cell = *m_iterators[i];
                row += padding + cell;
                padding = cell.size() < width ? std::string(width - cell.size(), ' ')
                                              : std::string();
            }
            return row;
        }

        // Advances every column that still has lines left.
        iterator &operator++() {
            for (size_t i = 0; i < m_columns.size(); ++i) {
                if (m_iterators[i] != m_columns[i].end())
                    ++m_iterators[i];
            }
            return *this;
        }
        iterator operator++(int) {
            iterator previous(*this);
            operator++();
            return previous;
        }
    };
    using const_iterator = iterator;

    iterator begin() const { return iterator(*this); }
    iterator end() const { return {*this, iterator::EndTag()}; }

    // Appends a column on the right.
    Columns &operator+=(Column const &col) {
        m_columns.push_back(col);
        return *this;
    }
    // Returns a copy of this set with `col` appended on the right.
    Columns operator+(Column const &col) {
        Columns combined = *this;
        combined += col;
        return combined;
    }

    // Streams the rows separated by "\n" (no trailing newline).
    inline friend std::ostream &operator<<(std::ostream &os, Columns const &cols) {
        bool needsNewline = false;
        for (auto it = cols.begin(), last = cols.end(); it != last; ++it) {
            if (needsNewline)
                os << "\n";
            os << *it;
            needsNewline = true;
        }
        return os;
    }

    // Returns the same text that operator<< would write.
    std::string toString() const {
        std::ostringstream buffer;
        buffer << *this;
        return buffer.str();
    }
};

inline auto Column::operator+(Column const &other) -> Columns {
    Columns cols;
    cols += *this;
    cols += other;
    return cols;
}
}  // namespace TextFlow

}  // namespace clara
}  // namespace Catch

// ----------- end of #include from clara_textflow.hpp -----------
// ........... back in clara.hpp

#include <algorithm>
#include <cctype>
#include <memory>
#include <set>
#include <string>

#if !defined(CATCH_PLATFORM_WINDOWS) && \
        (defined(WIN32) || defined(__WIN32__) || defined(_WIN32) || defined(_MSC_VER))
#define CATCH_PLATFORM_WINDOWS
#endif

namespace Catch {
namespace clara {
namespace detail {

// Traits for extracting arg and return type of lambdas (for single argument
// lambdas)
// Primary template: for a callable type L, defer to the specialisation that
// matches the type of L's operator() (a pointer to const member function).
template <typename L>
struct UnaryLambdaTraits : UnaryLambdaTraits<decltype(&L::operator())> {};

// General case: a const call operator with any number of arguments. Marked
// invalid; the single-argument specialisation below is more specialised and
// takes over when exactly one argument is declared.
template <typename ClassT, typename ReturnT, typename... Args>
struct UnaryLambdaTraits<ReturnT (ClassT::*)(Args...) const> {
    static const bool isValid = false;
};

// Exactly one argument: valid. ArgType is the argument type with any
// reference and top-level const removed; ReturnType is the declared return type.
template <typename ClassT, typename ReturnT, typename ArgT>
struct UnaryLambdaTraits<ReturnT (ClassT::*)(ArgT) const> {
    static const bool isValid = true;
    using ArgType = typename std::remove_const<typename std::remove_reference<ArgT>::type>::type;
    using ReturnType = ReturnT;
};

class TokenStream;

// Transport for raw args (copied from main args, or supplied via init list for
// testing)
// Holds the executable name and the remaining raw arguments as strings.
//
// Both constructors tolerate an empty argument set (argc == 0, a null argv,
// a null argv[0], or an empty initializer list): the executable name is then
// left empty and there are no arguments. Previously those inputs dereferenced
// a null pointer / an empty list's begin().
class Args {
    // TokenStream reads m_args directly to build its token iterators.
    friend class TokenStream;
    std::string m_exeName;
    std::vector<std::string> m_args;

public:
    // Builds from main()-style arguments: argv[0] is the executable name and
    // argv[1..argc) are the arguments.
    Args(int argc, char const *const *argv) {
        if (argc > 0 && argv != nullptr) {
            if (argv[0] != nullptr)
                m_exeName = argv[0];
            m_args.assign(argv + 1, argv + argc);
        }
    }

    // Builds from a list whose first element is the executable name and whose
    // remaining elements are the arguments.
    Args(std::initializer_list<std::string> args) {
        if (args.size() != 0) {
            m_exeName = *args.begin();
            m_args.assign(args.begin() + 1, args.end());
        }
    }

    // Returns a copy of the executable name (empty if none was supplied).
    auto exeName() const -> std::string { return m_exeName; }
};

// Wraps a token coming from a token stream. These may not directly correspond
// to strings as a single string may encode an option + its argument if the : or
// = form is used
// Kind of a token: an option name (e.g. "-x", "--name") or an argument value.
enum class TokenType { Option, Argument };
// One token produced by TokenStream.
struct Token {
    TokenType type;
    // Token text; for options this includes the leading prefix character(s).
    std::string token;
};

// Reports whether `c` introduces an option: '-' everywhere, and additionally
// '/' when CATCH_PLATFORM_WINDOWS is defined.
inline bool isOptPrefix(char c) {
#ifdef CATCH_PLATFORM_WINDOWS
    if (c == '/')
        return true;
#endif
    return c == '-';
}

// Abstracts iterators into args as a stream of tokens, with option arguments
// uniformly handled
class TokenStream {
    using Iterator = std::vector<std::string>::const_iterator;
    Iterator it;
    Iterator itEnd;
    std::vector<Token> m_tokenBuffer;

    void loadBuffer() {
        m_tokenBuffer.resize(0);

        // Skip any empty strings
        while (it != itEnd && it->empty())
            ++it;

        if (it != itEnd) {
            auto const &next = *it;
            if (isOptPrefix(next[0])) {
                auto delimiterPos = next.find_first_of(" :=");
                if (delimiterPos != std::string::npos) {
                    m_tokenBuffer.push_back({TokenType::Option, next.substr(0, delimiterPos)});
                    m_tokenBuffer.push_back({TokenType::Argument, next.substr(delimiterPos + 1)});
                } else {
                    if (next[1] != '-' && next.size() > 2) {
                        std::string opt = "- ";
                        for (size_t i = 1; i < next.size(); ++i) {
                            opt[1] = next[i];
                            m_tokenBuffer.push_back({TokenType::Option, opt});
                        }
                    } else {
                        m_tokenBuffer.push_back({TokenType::Option, next});
                    }
                }
            } else {
                m_tokenBuffer.push_back({TokenType::Argument, next});
            }
        }
    }

public:
    explicit TokenStream(Args const &args) : TokenStream(args.m_args.begin(), args.m_args.end()) {}

    TokenStream(Iterator it, Iterator itEnd) : it(it), itEnd(itEnd) { loadBuffer(); }

    explicit operator bool() const { return !m_tokenBuffer.empty() || it != itEnd; }

    auto count() const -> size_t { return m_tokenBuffer.size() + (itEnd - it); }

    auto operator*() const -> Token {
        assert(!m_tokenBuffer.empty());
        return m_tokenBuffer.front();
    }

    auto operator->() const -> Token const * {
        assert(!m_tokenBuffer.empty());
        return &m_tokenBuffer.front();
    }

    auto operator++() -> TokenStream & {
        if (m_tokenBuffer.size() >= 2) {
            m_tokenBuffer.erase(m_tokenBuffer.begin());
        } else {
            if (it != itEnd)
                ++it;
            loadBuffer();
        }
        return *this;
    }
};

// Common base of all result types: stores which kind of result this is.
class ResultBase {
public:
    // Ok means success; the two error kinds distinguish logic errors from
    // runtime errors.
    enum Type { Ok, LogicError, RuntimeError };

protected:
    ResultBase(Type type) : m_type(type) {}
    virtual ~ResultBase() = default;

    // Implemented by derived classes; called before a stored value is read.
    virtual void enforceOk() const = 0;

    Type m_type;
};

// Adds optional storage for a value of type T to ResultBase. The value lives
// in an anonymous union and is only constructed (and later destroyed) when
// the result type is Ok.
template <typename T>
class ResultValueBase : public ResultBase {
public:
    // Returns the stored value; enforceOk() is called first so that derived
    // classes can reject access on an error result.
    auto value() const -> T const & {
        enforceOk();
        return m_value;
    }

protected:
    // Creates a result of the given type without constructing a value.
    ResultValueBase(Type type) : ResultBase(type) {}

    ResultValueBase(ResultValueBase const &other) : ResultBase(other) {
        if (m_type == ResultBase::Ok)
            new (&m_value) T(other.m_value);
    }

    // Creates an Ok result holding a copy of `value`; the Type argument is
    // ignored.
    ResultValueBase(Type, T const &value) : ResultBase(Ok) { new (&m_value) T(value); }

    auto operator=(ResultValueBase const &other) -> ResultValueBase & {
        // Self-assignment must be a no-op: the steps below would destroy
        // m_value and then copy-construct it from the destroyed object.
        if (this == &other)
            return *this;

        if (m_type == ResultBase::Ok)
            m_value.~T();
        ResultBase::operator=(other);
        if (m_type == ResultBase::Ok)
            new (&m_value) T(other.m_value);
        return *this;
    }

    ~ResultValueBase() override {
        if (m_type == Ok)
            m_value.~T();
    }

    // Manually managed storage; see the constructors and destructor above.
    union {
        T m_value;
    };
};

// Specialisation for results that carry no value: nothing is stored beyond
// the result type, so the ResultBase constructors are inherited unchanged.
template <>
class ResultValueBase<void> : public ResultBase {
protected:
    using ResultBase::ResultBase;
};

// A result that is either Ok (optionally carrying a T) or an error with a
// message. Instances are created through the static factory functions.
template <typename T = void>
class BasicResult : public ResultValueBase<T> {
public:
    // Converts an error result of another value type into this type, keeping
    // its result type and message. The source must not be Ok.
    template <typename U>
    explicit BasicResult(BasicResult<U> const &other)
            : ResultValueBase<T>(other.type()), m_errorMessage(other.errorMessage()) {
        assert(type() != ResultBase::Ok);
    }

    template <typename U>
    static BasicResult ok(U const &value) {
        return {ResultBase::Ok, value};
    }
    static BasicResult ok() { return {ResultBase::Ok}; }
    static BasicResult logicError(std::string const &message) {
        return {ResultBase::LogicError, message};
    }
    static BasicResult runtimeError(std::string const &message) {
        return {ResultBase::RuntimeError, message};
    }

    explicit operator bool() const { return m_type == ResultBase::Ok; }
    ResultBase::Type type() const { return m_type; }
    std::string errorMessage() const { return m_errorMessage; }

protected:
    // Asserts (debug builds) and aborts (all builds) when the result is not Ok.
    void enforceOk() const override {
        // Errors shouldn't reach this point, but if they do
        // the actual error message will be in m_errorMessage
        assert(m_type != ResultBase::LogicError);
        assert(m_type != ResultBase::RuntimeError);
        if (m_type == ResultBase::Ok)
            return;
        std::abort();
    }

    std::string m_errorMessage;  // Only populated if resultType is an error

    // Creates an error result; `type` must not be Ok.
    BasicResult(ResultBase::Type type, std::string const &message)
            : ResultValueBase<T>(type), m_errorMessage(message) {
        assert(m_type != ResultBase::Ok);
    }

    using ResultValueBase<T>::ResultValueBase;
    using ResultBase::m_type;
};

// Outcome reported by a parser or a bound value/flag setter. Opt::parse
// returns immediately, without consuming the token, when a setter reports
// ShortCircuitAll (the Help option's lambda does this).
enum class ParseResultType { Matched, NoMatch, ShortCircuitAll, ShortCircuitSame };

class ParseState {
public:
    ParseState(ParseResultType type, TokenStream const &remainingTokens)
            : m_type(type), m_remainingTokens(remainingTokens) {}

    auto type() const -> ParseResultType { return m_type; }
    auto remainingTokens() const -> TokenStream { return m_remainingTokens; }

private:
    ParseResultType m_type;
    TokenStream m_remainingTokens;
};

using Result = BasicResult<void>;
using ParserResult = BasicResult<ParseResultType>;
using InternalParseResult = BasicResult<ParseState>;

// One row of help output. Opt::getHelpColumns fills `left` with the option
// names (plus hint) and `right` with the description.
struct HelpColumns {
    std::string left;
    std::string right;
};

// Generic conversion: parses `source` into `target` using stream extraction
// (operator>>). Returns a runtime error if the extraction fails.
template <typename T>
inline ParserResult convertInto(std::string const &source, T &target) {
    std::stringstream stream;
    stream << source;
    stream >> target;
    if (!stream.fail())
        return ParserResult::ok(ParseResultType::Matched);
    return ParserResult::runtimeError("Unable to convert '" + source + "' to destination type");
}
// String overload: copies `source` verbatim (no whitespace splitting) and
// always succeeds.
inline ParserResult convertInto(std::string const &source, std::string &target) {
    target.assign(source);
    return ParserResult::ok(ParseResultType::Matched);
}
// Boolean overload: accepts y/1/true/yes/on and n/0/false/no/off in any
// letter case. Any other text yields a runtime error and leaves `target`
// untouched.
inline ParserResult convertInto(std::string const &source, bool &target) {
    // Lower-case copy; the cast to unsigned char keeps std::tolower defined
    // for characters with negative char values.
    std::string lowered;
    lowered.reserve(source.size());
    for (char ch : source)
        lowered.push_back(static_cast<char>(std::tolower(static_cast<unsigned char>(ch))));

    static char const *const trueWords[] = {"y", "1", "true", "yes", "on"};
    static char const *const falseWords[] = {"n", "0", "false", "no", "off"};

    for (char const *word : trueWords) {
        if (lowered == word) {
            target = true;
            return ParserResult::ok(ParseResultType::Matched);
        }
    }
    for (char const *word : falseWords) {
        if (lowered == word) {
            target = false;
            return ParserResult::ok(ParseResultType::Matched);
        }
    }
    return ParserResult::runtimeError("Expected a boolean value but did not recognise: '" +
                                      source + "'");
}
#ifdef CLARA_CONFIG_OPTIONAL_TYPE
// Optional overload: converts into a temporary T and stores it in `target`
// only when the conversion succeeds.
template <typename T>
inline ParserResult convertInto(std::string const &source, CLARA_CONFIG_OPTIONAL_TYPE<T> &target) {
    T parsed;
    auto outcome = convertInto(source, parsed);
    if (outcome)
        target = std::move(parsed);
    return outcome;
}
#endif  // CLARA_CONFIG_OPTIONAL_TYPE

// Base for types that must be neither copied nor moved.
struct NonCopyable {
    NonCopyable() = default;

    // Copying is disabled.
    NonCopyable(NonCopyable const &) = delete;
    NonCopyable &operator=(NonCopyable const &) = delete;

    // Moving is disabled as well.
    NonCopyable(NonCopyable &&) = delete;
    NonCopyable &operator=(NonCopyable &&) = delete;
};

// Base of everything a parser can bind to. Both queries default to false and
// are overridden by container and flag bindings respectively.
struct BoundRef : NonCopyable {
    virtual ~BoundRef() = default;
    virtual bool isContainer() const { return false; }
    virtual bool isFlag() const { return false; }
};
// A binding that receives its value as the argument text.
struct BoundValueRefBase : BoundRef {
    virtual ParserResult setValue(std::string const &arg) = 0;
};
struct BoundFlagRefBase : BoundRef {
    virtual auto setFlag(bool flag) -> ParserResult = 0;
    virtual auto isFlag() const -> bool { return true; }
};

// Binds a single variable: each value is converted with convertInto and
// written straight into the referenced object.
template <typename T>
struct BoundValueRef : BoundValueRefBase {
    T &m_ref;

    explicit BoundValueRef(T &ref) : m_ref(ref) {}

    ParserResult setValue(std::string const &arg) override {
        return convertInto(arg, m_ref);
    }
};

// Binds a vector: each successfully converted value is appended, so the
// binding can be set any number of times.
template <typename T>
struct BoundValueRef<std::vector<T>> : BoundValueRefBase {
    std::vector<T> &m_ref;

    explicit BoundValueRef(std::vector<T> &ref) : m_ref(ref) {}

    bool isContainer() const override { return true; }

    ParserResult setValue(std::string const &arg) override {
        T element;
        auto outcome = convertInto(arg, element);
        // Only append when the conversion succeeded.
        if (outcome)
            m_ref.push_back(element);
        return outcome;
    }
};

// Binds a bool variable that is assigned whenever the flag is set.
struct BoundFlagRef : BoundFlagRefBase {
    bool &m_ref;

    explicit BoundFlagRef(bool &ref) : m_ref(ref) {}

    ParserResult setFlag(bool flag) override {
        m_ref = flag;
        return ParserResult::ok(ParseResultType::Matched);
    }
};

// Calls a user lambda and normalises its result to a ParserResult.
// Primary template: the lambda itself returns a ParserResult, which is
// forwarded unchanged.
template <typename ReturnType>
struct LambdaInvoker {
    static_assert(std::is_same<ReturnType, ParserResult>::value,
                  "Lambda must return void or clara::ParserResult");

    template <typename L, typename ArgType>
    static ParserResult invoke(L const &lambda, ArgType const &arg) {
        return lambda(arg);
    }
};

// void-returning lambdas: the call is reported as a successful match.
template <>
struct LambdaInvoker<void> {
    template <typename L, typename ArgType>
    static ParserResult invoke(L const &lambda, ArgType const &arg) {
        lambda(arg);
        return ParserResult::ok(ParseResultType::Matched);
    }
};

// Converts `arg` to ArgType and, if that succeeds, passes the converted value
// to `lambda`. A failed conversion is returned as-is and the lambda is not
// called.
template <typename ArgType, typename L>
inline ParserResult invokeLambda(L const &lambda, std::string const &arg) {
    ArgType converted{};
    auto conversion = convertInto(arg, converted);
    if (!conversion)
        return conversion;
    return LambdaInvoker<typename UnaryLambdaTraits<L>::ReturnType>::invoke(lambda, converted);
}

// Binds a one-argument lambda as a value target: the argument text is
// converted to the lambda's parameter type before the lambda is called.
template <typename L>
struct BoundLambda : BoundValueRefBase {
    L m_lambda;

    static_assert(UnaryLambdaTraits<L>::isValid, "Supplied lambda must take exactly one argument");
    explicit BoundLambda(L const &lambda) : m_lambda(lambda) {}

    ParserResult setValue(std::string const &arg) override {
        using LambdaArg = typename UnaryLambdaTraits<L>::ArgType;
        return invokeLambda<LambdaArg>(m_lambda, arg);
    }
};

// Binds a lambda taking a single bool as a flag target.
template <typename L>
struct BoundFlagLambda : BoundFlagRefBase {
    L m_lambda;

    static_assert(UnaryLambdaTraits<L>::isValid, "Supplied lambda must take exactly one argument");
    static_assert(std::is_same<typename UnaryLambdaTraits<L>::ArgType, bool>::value,
                  "flags must be boolean");

    explicit BoundFlagLambda(L const &lambda) : m_lambda(lambda) {}

    ParserResult setFlag(bool flag) override {
        using LambdaReturn = typename UnaryLambdaTraits<L>::ReturnType;
        return LambdaInvoker<LambdaReturn>::invoke(m_lambda, flag);
    }
};

// Whether a parser element has been marked optional or required
// (see ParserRefImpl::optional() / required()).
enum class Optionality { Optional, Required };

struct Parser;

// Interface shared by all parser elements.
class ParserBase {
public:
    virtual ~ParserBase() = default;

    // Checks the parser's own configuration; the default reports success.
    virtual Result validate() const { return Result::ok(); }

    // Attempts to parse from the front of `tokens`.
    virtual InternalParseResult parse(std::string const &exeName,
                                      TokenStream const &tokens) const = 0;

    // Default is 1; ParserRefImpl returns 0 for container bindings.
    virtual size_t cardinality() const { return 1; }

    // Convenience overload: tokenises `args` and forwards to the virtual parse.
    InternalParseResult parse(Args const &args) const {
        return parse(args.exeName(), TokenStream(args));
    }
};

// CRTP-style base that gives a parser element the `|` and `+` composition
// operators. Both yield a Parser; the definitions are not in this part of the
// file.
template <typename DerivedT>
class ComposableParserImpl : public ParserBase {
public:
    template <typename T>
    auto operator|(T const &other) const -> Parser;

    template <typename T>
    auto operator+(T const &other) const -> Parser;
};

// Common code and state for Args and Opts
// Holds what Arg and Opt have in common: the bound target, a hint, a
// description and the optional/required setting. The setters return DerivedT&
// so that calls can be chained on the concrete type.
template <typename DerivedT>
class ParserRefImpl : public ComposableParserImpl<DerivedT> {
protected:
    Optionality m_optionality = Optionality::Optional;
    std::shared_ptr<BoundRef> m_ref;
    std::string m_hint;
    std::string m_description;

    // Used by derived classes that build the binding themselves.
    explicit ParserRefImpl(std::shared_ptr<BoundRef> const &ref) : m_ref(ref) {}

public:
    // Binds to a variable (non-const lvalue).
    template <typename T>
    ParserRefImpl(T &ref, std::string const &hint)
            : m_ref(std::make_shared<BoundValueRef<T>>(ref)), m_hint(hint) {}

    // Binds to a lambda taking one argument.
    template <typename LambdaT>
    ParserRefImpl(LambdaT const &ref, std::string const &hint)
            : m_ref(std::make_shared<BoundLambda<LambdaT>>(ref)), m_hint(hint) {}

    // Sets the description.
    auto operator()(std::string const &description) -> DerivedT & {
        m_description = description;
        return static_cast<DerivedT &>(*this);
    }

    auto optional() -> DerivedT & {
        m_optionality = Optionality::Optional;
        return static_cast<DerivedT &>(*this);
    }

    auto required() -> DerivedT & {
        m_optionality = Optionality::Required;
        return static_cast<DerivedT &>(*this);
    }

    auto isOptional() const -> bool { return m_optionality == Optionality::Optional; }

    // 0 for container bindings, 1 otherwise.
    auto cardinality() const -> size_t override {
        if (m_ref->isContainer())
            return 0;
        else
            return 1;
    }

    auto hint() const -> std::string { return m_hint; }
};

// Tracks the executable's name and optionally forwards it to a bound string
// or lambda. The name is held through a shared_ptr, so copies of an ExeName
// share the same stored name.
class ExeName : public ComposableParserImpl<ExeName> {
    std::shared_ptr<std::string> m_name;
    std::shared_ptr<BoundValueRefBase> m_ref;

    template <typename LambdaT>
    static std::shared_ptr<BoundValueRefBase> makeRef(LambdaT const &lambda) {
        return std::make_shared<BoundLambda<LambdaT>>(lambda);
    }

public:
    // Starts with the placeholder name "<executable>" and no binding.
    ExeName() : m_name(std::make_shared<std::string>("<executable>")) {}

    explicit ExeName(std::string &ref) : ExeName() {
        m_ref = std::make_shared<BoundValueRef<std::string>>(ref);
    }

    template <typename LambdaT>
    explicit ExeName(LambdaT const &lambda) : ExeName() {
        m_ref = makeRef(lambda);
    }

    // The exe name is not parsed out of the normal tokens, but is handled
    // specially
    InternalParseResult parse(std::string const &, TokenStream const &tokens) const override {
        return InternalParseResult::ok(ParseState(ParseResultType::NoMatch, tokens));
    }

    std::string name() const { return *m_name; }

    // Stores the file-name part of `newName` (everything after the last '/'
    // or '\\') and forwards it to the binding, if there is one.
    ParserResult set(std::string const &newName) {
        auto const lastSlash = newName.find_last_of("\\/");
        std::string const filename =
                (lastSlash == std::string::npos) ? newName : newName.substr(lastSlash + 1);

        *m_name = filename;
        if (!m_ref)
            return ParserResult::ok(ParseResultType::Matched);
        return m_ref->setValue(filename);
    }
};

// A positional argument: consumes one Argument token and passes its text to
// the bound value.
class Arg : public ParserRefImpl<Arg> {
public:
    using ParserRefImpl::ParserRefImpl;

    // Returns:
    //  - the validation error, if validate() fails;
    //  - NoMatch (tokens untouched) if there is no token left or the next
    //    token is not an Argument;
    //  - the setter's error, if converting/storing the value fails;
    //  - Matched with the token consumed otherwise.
    auto parse(std::string const &, TokenStream const &tokens) const
            -> InternalParseResult override {
        auto validationResult = validate();
        if (!validationResult)
            return InternalParseResult(validationResult);

        auto remainingTokens = tokens;
        // An exhausted stream has an empty token buffer; dereferencing it
        // would read front() of an empty vector. Opt::parse guards the same
        // way.
        if (!remainingTokens)
            return InternalParseResult::ok(ParseState(ParseResultType::NoMatch, remainingTokens));

        auto const &token = *remainingTokens;
        if (token.type != TokenType::Argument)
            return InternalParseResult::ok(ParseState(ParseResultType::NoMatch, remainingTokens));

        assert(!m_ref->isFlag());
        auto valueRef = static_cast<detail::BoundValueRefBase *>(m_ref.get());

        auto result = valueRef->setValue(remainingTokens->token);
        if (!result)
            return InternalParseResult(result);
        else
            return InternalParseResult::ok(ParseState(ParseResultType::Matched, ++remainingTokens));
    }
};

// Returns the canonical spelling of an option name. When
// CATCH_PLATFORM_WINDOWS is defined a leading '/' is rewritten to '-';
// otherwise the name is returned unchanged.
inline std::string normaliseOpt(std::string const &optName) {
#ifdef CATCH_PLATFORM_WINDOWS
    if (optName[0] == '/')
        return "-" + optName.substr(1);
#endif
    return optName;
}

// A named option. It is either a flag (bound to a bool or a bool lambda, no
// argument) or a value option (bound to a variable or lambda, with a hint)
// that consumes the following Argument token.
class Opt : public ParserRefImpl<Opt> {
protected:
    std::vector<std::string> m_optNames;

public:
    // Flag bound to a lambda taking bool.
    template <typename LambdaT>
    explicit Opt(LambdaT const &ref)
            : ParserRefImpl(std::make_shared<BoundFlagLambda<LambdaT>>(ref)) {}

    // Flag bound to a bool variable.
    explicit Opt(bool &ref) : ParserRefImpl(std::make_shared<BoundFlagRef>(ref)) {}

    // Value option bound to a lambda.
    template <typename LambdaT>
    Opt(LambdaT const &ref, std::string const &hint) : ParserRefImpl(ref, hint) {}

    // Value option bound to a variable.
    template <typename T>
    Opt(T &ref, std::string const &hint) : ParserRefImpl(ref, hint) {}

    // Registers one more name for this option.
    Opt &operator[](std::string const &optName) {
        m_optNames.push_back(optName);
        return *this;
    }

    // One help row: "name1, name2 <hint>" on the left, the description on the
    // right.
    std::vector<HelpColumns> getHelpColumns() const {
        std::ostringstream left;
        for (size_t i = 0; i < m_optNames.size(); ++i) {
            if (i != 0)
                left << ", ";
            left << m_optNames[i];
        }
        if (!m_hint.empty())
            left << " <" << m_hint << ">";
        return {{left.str(), m_description}};
    }

    // True when `optToken` equals one of the registered names after both are
    // normalised.
    bool isMatch(std::string const &optToken) const {
        auto const wanted = normaliseOpt(optToken);
        return std::any_of(m_optNames.begin(), m_optNames.end(),
                           [&wanted](std::string const &name) {
                               return normaliseOpt(name) == wanted;
                           });
    }

    using ParserBase::parse;

    // Tries to consume this option (and, for value options, its argument)
    // from the front of `tokens`.
    InternalParseResult parse(std::string const &, TokenStream const &tokens) const override {
        auto validationResult = validate();
        if (!validationResult)
            return InternalParseResult(validationResult);

        auto remainingTokens = tokens;

        bool const atOption = remainingTokens && remainingTokens->type == TokenType::Option;
        if (!atOption)
            return InternalParseResult::ok(ParseState(ParseResultType::NoMatch, remainingTokens));

        // operator* returns a copy, so this stays valid after the stream is
        // advanced below.
        auto const &optToken = *remainingTokens;
        if (!isMatch(optToken.token))
            return InternalParseResult::ok(ParseState(ParseResultType::NoMatch, remainingTokens));

        if (m_ref->isFlag()) {
            auto flagRef = static_cast<detail::BoundFlagRefBase *>(m_ref.get());
            auto flagResult = flagRef->setFlag(true);
            if (!flagResult)
                return InternalParseResult(flagResult);
            if (flagResult.value() == ParseResultType::ShortCircuitAll)
                return InternalParseResult::ok(ParseState(flagResult.value(), remainingTokens));
        } else {
            auto valueRef = static_cast<detail::BoundValueRefBase *>(m_ref.get());

            // Step over the option name; the value must be the next token.
            ++remainingTokens;
            if (!remainingTokens)
                return InternalParseResult::runtimeError("Expected argument following " +
                                                         optToken.token);
            auto const &argToken = *remainingTokens;
            if (argToken.type != TokenType::Argument)
                return InternalParseResult::runtimeError("Expected argument following " +
                                                         optToken.token);

            auto valueResult = valueRef->setValue(argToken.token);
            if (!valueResult)
                return InternalParseResult(valueResult);
            if (valueResult.value() == ParseResultType::ShortCircuitAll)
                return InternalParseResult::ok(ParseState(valueResult.value(), remainingTokens));
        }

        return InternalParseResult::ok(ParseState(ParseResultType::Matched, ++remainingTokens));
    }

    // Requires at least one name, and every name to be non-empty and to start
    // with an option prefix.
    Result validate() const override {
        if (m_optNames.empty())
            return Result::logicError("No options supplied to Opt");

        for (auto const &name : m_optNames) {
            if (name.empty())
                return Result::logicError("Option name cannot be empty");
#ifdef CATCH_PLATFORM_WINDOWS
            if (name[0] != '-' && name[0] != '/')
                return Result::logicError("Option name must begin with '-' or '/'");
#else
            if (name[0] != '-')
                return Result::logicError("Option name must begin with '-'");
#endif
        }
        return ParserRefImpl::validate();
    }
};

struct Help : Opt {
    Help(bool &showHelpFlag)
            : Opt([&](bool flag) {
                  showHelpFlag = flag;
                  return ParserResult::ok(ParseResultType::ShortCircuitAll);
              }) {
        static_cast<Opt &> (*this)("display usage information")["-?"]["-h"]["--help"].optional();
    }
};

// Composite command-line parser. Holds the executable name together with the
// option parsers and positional-argument parsers that were combined with '|'
// (or the deprecated '+'), and dispatches command-line tokens to them.
struct Parser : ParserBase {
    // mutable: the const parse() overload records the executable name here.
    mutable ExeName m_exeName;
    std::vector<Opt> m_options;
    std::vector<Arg> m_args;

    // Replaces the stored executable name.
    auto operator|=(ExeName const &exeName) -> Parser & {
        m_exeName = exeName;
        return *this;
    }

    // Appends a positional-argument parser.
    auto operator|=(Arg const &arg) -> Parser & {
        m_args.push_back(arg);
        return *this;
    }

    // Appends an option parser.
    auto operator|=(Opt const &opt) -> Parser & {
        m_options.push_back(opt);
        return *this;
    }

    // Appends all options and arguments of another Parser. The other
    // parser's executable name is not copied.
    auto operator|=(Parser const &other) -> Parser & {
        m_options.insert(m_options.end(), other.m_options.begin(), other.m_options.end());
        m_args.insert(m_args.end(), other.m_args.begin(), other.m_args.end());
        return *this;
    }

    // Non-mutating composition: returns a copy of this parser extended with
    // `other`.
    template <typename T>
    auto operator|(T const &other) const -> Parser {
        return Parser(*this) |= other;
    }

    // Forward deprecated interface with '+' instead of '|'
    template <typename T>
    auto operator+=(T const &other) -> Parser & {
        return operator|=(other);
    }
    template <typename T>
    auto operator+(T const &other) const -> Parser {
        return operator|(other);
    }

    // Collects the help columns of every option, in registration order.
    // Positional arguments contribute no rows.
    auto getHelpColumns() const -> std::vector<HelpColumns> {
        std::vector<HelpColumns> cols;
        for (auto const &o : m_options) {
            auto childCols = o.getHelpColumns();
            cols.insert(cols.end(), childCols.begin(), childCols.end());
        }
        return cols;
    }

    // Writes the help text to `os`: a usage line (only when an executable
    // name is known) followed by one two-column row per option.
    void writeToStream(std::ostream &os) const {
        if (!m_exeName.name().empty()) {
            os << "usage:\n"
               << "  " << m_exeName.name() << " ";
            // `required` stays true until the first optional argument is
            // seen; from there on the arguments are wrapped in one "[...]".
            bool required = true, first = true;
            for (auto const &arg : m_args) {
                if (first)
                    first = false;
                else
                    os << " ";
                if (arg.isOptional() && required) {
                    os << "[";
                    required = false;
                }
                os << "<" << arg.hint() << ">";
                // Cardinality 0 means "any number of values".
                if (arg.cardinality() == 0)
                    os << " ... ";
            }
            if (!required)
                os << "]";
            if (!m_options.empty())
                os << " options";
            os << "\n\nwhere options are:" << std::endl;
        }

        auto rows = getHelpColumns();
        size_t consoleWidth = CATCH_CLARA_CONFIG_CONSOLE_WIDTH;
        size_t optWidth = 0;
        for (auto const &cols : rows)
            optWidth = (std::max)(optWidth, cols.left.size() + 2);

        // The option-name column never takes more than half of the console.
        optWidth = (std::min)(optWidth, consoleWidth / 2);

        for (auto const &cols : rows) {
            auto row = TextFlow::Column(cols.left).width(optWidth).indent(2) + TextFlow::Spacer(4) +
                       TextFlow::Column(cols.right).width(consoleWidth - 7 - optWidth);
            os << row << std::endl;
        }
    }

    friend auto operator<<(std::ostream &os, Parser const &parser) -> std::ostream & {
        parser.writeToStream(os);
        return os;
    }

    // Validates every option and then every argument, returning the first
    // failure encountered, or ok() if all of them are valid.
    auto validate() const -> Result override {
        for (auto const &opt : m_options) {
            auto result = opt.validate();
            if (!result)
                return result;
        }
        for (auto const &arg : m_args) {
            auto result = arg.validate();
            if (!result)
                return result;
        }
        return Result::ok();
    }

    using ParserBase::parse;

    // Parses `tokens` by repeatedly offering the remaining tokens to each
    // sub-parser (options first, then arguments) that has not yet reached its
    // cardinality (0 = unlimited). The first sub-parser that reports anything
    // other than NoMatch consumes the token(s).
    //
    // Returns the failing result if a sub-parser fails, a runtime error if no
    // sub-parser recognises the current token, and returns immediately when a
    // sub-parser reports ShortCircuitAll.
    auto parse(std::string const &exeName, TokenStream const &tokens) const
            -> InternalParseResult override {
        struct ParserInfo {
            ParserBase const *parser = nullptr;
            size_t count = 0;
        };
        const size_t totalParsers = m_options.size() + m_args.size();
        // Sized at run time. A fixed-size stack array guarded only by an
        // assert() would be overrun in NDEBUG builds once the number of
        // sub-parsers exceeded its capacity.
        std::vector<ParserInfo> parseInfos(totalParsers);

        {
            size_t i = 0;
            for (auto const &opt : m_options)
                parseInfos[i++].parser = &opt;
            for (auto const &arg : m_args)
                parseInfos[i++].parser = &arg;
        }

        m_exeName.set(exeName);

        auto result = InternalParseResult::ok(ParseState(ParseResultType::NoMatch, tokens));
        while (result.value().remainingTokens()) {
            bool tokenParsed = false;

            for (size_t i = 0; i < totalParsers; ++i) {
                auto &parseInfo = parseInfos[i];
                if (parseInfo.parser->cardinality() == 0 ||
                    parseInfo.count < parseInfo.parser->cardinality()) {
                    result = parseInfo.parser->parse(exeName, result.value().remainingTokens());
                    if (!result)
                        return result;
                    if (result.value().type() != ParseResultType::NoMatch) {
                        tokenParsed = true;
                        ++parseInfo.count;
                        break;
                    }
                }
            }

            if (result.value().type() == ParseResultType::ShortCircuitAll)
                return result;
            if (!tokenParsed)
                return InternalParseResult::runtimeError("Unrecognised token: " +
                                                         result.value().remainingTokens()->token);
        }
        // !TBD Check missing required options
        return result;
    }
};

// Combines this parser component with `other` into a new Parser: this
// component is added first, then `other`.
template <typename DerivedT>
template <typename T>
auto ComposableParserImpl<DerivedT>::operator|(T const &other) const -> Parser {
    Parser combined;
    combined |= static_cast<DerivedT const &>(*this);
    combined |= other;
    return combined;
}
}  // namespace detail

// A Combined parser
using detail::Parser;

// A parser for options
using detail::Opt;

// A parser for arguments
using detail::Arg;

// Wrapper for argc, argv from main()
using detail::Args;

// Specifies the name of the executable
using detail::ExeName;

// Convenience wrapper for option parser that specifies the help option
using detail::Help;

// enum of result types from a parse
using detail::ParseResultType;

// Result type for parser operation
using detail::ParserResult;

}  // namespace clara
}  // namespace Catch

// end clara.hpp
#ifdef __clang__
#pragma clang diagnostic pop
#endif

// Restore Clara's value for console width, if present
#ifdef CATCH_TEMP_CLARA_CONFIG_CONSOLE_WIDTH
#define CATCH_CLARA_TEXTFLOW_CONFIG_CONSOLE_WIDTH CATCH_TEMP_CLARA_CONFIG_CONSOLE_WIDTH
#undef CATCH_TEMP_CLARA_CONFIG_CONSOLE_WIDTH
#endif

// end catch_clara.h
namespace Catch {

clara::Parser makeCommandLineParser(ConfigData &config);

}  // end namespace Catch

// end catch_commandline.h
#include <ctime>
#include <fstream>

namespace Catch {

// Builds the Clara parser for the test runner's command line. Every option
// either binds directly to a field of `config` or goes through one of the
// lambdas below, which validate the textual value before storing it.
// `config` is captured by reference, so it must outlive the returned parser.
clara::Parser makeCommandLineParser(ConfigData &config) {
    using namespace clara;

    // -w/--warn: accepts "NoAssertions" or "NoTests" and ORs the matching
    // flag into config.warnings; anything else is a runtime error.
    auto const setWarning = [&](std::string const &warning) {
        auto warningSet = [&]() {
            if (warning == "NoAssertions")
                return WarnAbout::NoAssertions;

            if (warning == "NoTests")
                return WarnAbout::NoTests;

            return WarnAbout::Nothing;
        }();

        if (warningSet == WarnAbout::Nothing)
            return ParserResult::runtimeError("Unrecognised warning: '" + warning + "'");
        config.warnings = static_cast<WarnAbout::What>(config.warnings | warningSet);
        return ParserResult::ok(ParseResultType::Matched);
    };
    // -f/--input-file: appends one quoted test name per non-empty,
    // non-comment ('#') line of the file to config.testsOrTags, with ","
    // entries between consecutive names.
    auto const loadTestNamesFromFile = [&](std::string const &filename) {
        std::ifstream f(filename.c_str());
        if (!f.is_open())
            return ParserResult::runtimeError("Unable to load input file: '" + filename + "'");

        bool addedAny = false;
        std::string line;
        while (std::getline(f, line)) {
            line = trim(line);
            if (!line.empty() && !startsWith(line, '#')) {
                if (!startsWith(line, '"'))
                    line = '"' + line + '"';
                config.testsOrTags.push_back(line);
                config.testsOrTags.emplace_back(",");
                addedAny = true;
            }
        }
        // Remove the trailing comma, but only if this file actually added
        // one. Otherwise the last entry belongs to a spec that was already
        // present before the file was read and must be kept.
        if (addedAny)
            config.testsOrTags.pop_back();

        return ParserResult::ok(ParseResultType::Matched);
    };
    // --order: `order` is matched as a prefix of "declared", "lexical" or
    // "random" (checked in that order), so abbreviations are accepted.
    auto const setTestOrder = [&](std::string const &order) {
        if (startsWith("declared", order))
            config.runOrder = RunTests::InDeclarationOrder;
        else if (startsWith("lexical", order))
            config.runOrder = RunTests::InLexicographicalOrder;
        else if (startsWith("random", order))
            config.runOrder = RunTests::InRandomOrder;
        else
            return clara::ParserResult::runtimeError("Unrecognised ordering: '" + order + "'");
        return ParserResult::ok(ParseResultType::Matched);
    };
    // --rng-seed: the literal "time" seeds from the current time; any other
    // value is converted into config.rngSeed by clara's convertInto.
    auto const setRngSeed = [&](std::string const &seed) {
        if (seed != "time")
            return clara::detail::convertInto(seed, config.rngSeed);
        config.rngSeed = static_cast<unsigned int>(std::time(nullptr));
        return ParserResult::ok(ParseResultType::Matched);
    };
    // --use-colour: case-insensitive "yes", "no" or "auto".
    auto const setColourUsage = [&](std::string const &useColour) {
        auto mode = toLower(useColour);

        if (mode == "yes")
            config.useColour = UseColour::Yes;
        else if (mode == "no")
            config.useColour = UseColour::No;
        else if (mode == "auto")
            config.useColour = UseColour::Auto;
        else
            return ParserResult::runtimeError("colour mode must be one of: auto, yes or no. '" +
                                              useColour + "' not recognised");
        return ParserResult::ok(ParseResultType::Matched);
    };
    // --wait-for-keypress: case-insensitive "never", "start", "exit" or "both".
    auto const setWaitForKeypress = [&](std::string const &keypress) {
        auto keypressLc = toLower(keypress);
        if (keypressLc == "never")
            config.waitForKeypress = WaitForKeypress::Never;
        else if (keypressLc == "start")
            config.waitForKeypress = WaitForKeypress::BeforeStart;
        else if (keypressLc == "exit")
            config.waitForKeypress = WaitForKeypress::BeforeExit;
        else if (keypressLc == "both")
            config.waitForKeypress = WaitForKeypress::BeforeStartAndExit;
        else
            return ParserResult::runtimeError(
                    "keypress argument must be one of: never, start, exit or both. '" + keypress +
                    "' not recognised");
        return ParserResult::ok(ParseResultType::Matched);
    };
    // -v/--verbosity: case-insensitive "quiet", "normal" or "high".
    auto const setVerbosity = [&](std::string const &verbosity) {
        auto lcVerbosity = toLower(verbosity);
        if (lcVerbosity == "quiet")
            config.verbosity = Verbosity::Quiet;
        else if (lcVerbosity == "normal")
            config.verbosity = Verbosity::Normal;
        else if (lcVerbosity == "high")
            config.verbosity = Verbosity::High;
        else
            return ParserResult::runtimeError("Unrecognised verbosity, '" + verbosity + "'");
        return ParserResult::ok(ParseResultType::Matched);
    };
    // -r/--reporter: the lower-cased name must be a key of the reporter
    // registry's factory map; the lower-cased form is what gets stored.
    auto const setReporter = [&](std::string const &reporter) {
        IReporterRegistry::FactoryMap const &factories =
                getRegistryHub().getReporterRegistry().getFactories();

        auto lcReporter = toLower(reporter);
        auto result = factories.find(lcReporter);

        if (factories.end() != result)
            config.reporterName = lcReporter;
        else
            return ParserResult::runtimeError("Unrecognized reporter, '" + reporter +
                                              "'. Check available with --list-reporters");
        return ParserResult::ok(ParseResultType::Matched);
    };

    auto cli =
            ExeName(config.processName) | Help(config.showHelp) |
            Opt(config.listTests)["-l"]["--list-tests"]("list all/matching test cases") |
            Opt(config.listTags)["-t"]["--list-tags"]("list all/matching tags") |
            Opt(config.showSuccessfulTests)["-s"]["--success"](
                    "include successful tests in output") |
            Opt(config.shouldDebugBreak)["-b"]["--break"]("break into debugger on failure") |
            Opt(config.noThrow)["-e"]["--nothrow"]("skip exception tests") |
            Opt(config.showInvisibles)["-i"]["--invisibles"]("show invisibles (tabs, newlines)") |
            Opt(config.outputFilename, "filename")["-o"]["--out"]("output filename") |
            Opt(setReporter, "name")["-r"]["--reporter"]("reporter to use (defaults to console)") |
            Opt(config.name, "name")["-n"]["--name"]("suite name") |
            Opt([&](bool) { config.abortAfter = 1; })["-a"]["--abort"]("abort at first failure") |
            Opt([&](int x) { config.abortAfter = x; },
                "no. failures")["-x"]["--abortx"]("abort after x failures") |
            Opt(setWarning, "warning name")["-w"]["--warn"]("enable warnings") |
            Opt(
                    [&](bool flag) {
                        config.showDurations = flag ? ShowDurations::Always : ShowDurations::Never;
                    },
                    "yes|no")["-d"]["--durations"]("show test durations") |
            Opt(config.minDuration, "seconds")["-D"]["--min-duration"](
                    "show test durations for tests taking at least the given number of "
                    "seconds") |
            Opt(loadTestNamesFromFile,
                "filename")["-f"]["--input-file"]("load test names to run from a file") |
            Opt(config.filenamesAsTags)["-#"]["--filenames-as-tags"](
                    "adds a tag for the filename") |
            Opt(config.sectionsToRun, "section name")["-c"]["--section"]("specify section to run") |
            Opt(setVerbosity, "quiet|normal|high")["-v"]["--verbosity"]("set output verbosity") |
            Opt(config.listTestNamesOnly)["--list-test-names-only"](
                    "list all/matching test cases names only") |
            Opt(config.listReporters)["--list-reporters"]("list all reporters") |
            Opt(setTestOrder, "decl|lex|rand")["--order"]("test case order (defaults to decl)") |
            Opt(setRngSeed,
                "'time'|number")["--rng-seed"]("set a specific seed for random numbers") |
            Opt(setColourUsage, "yes|no")["--use-colour"]("should output be colourised") |
            Opt(config.libIdentify)["--libidentify"](
                    "report name and version according to libidentify standard") |
            Opt(setWaitForKeypress, "never|start|exit|both")["--wait-for-keypress"](
                    "waits for a keypress before exiting") |
            Opt(config.benchmarkSamples,
                "samples")["--benchmark-samples"]("number of samples to collect (default: 100)") |
            Opt(config.benchmarkResamples, "resamples")["--benchmark-resamples"](
                    "number of resamples for the bootstrap (default: 100000)") |
            Opt(config.benchmarkConfidenceInterval,
                "confidence interval")["--benchmark-confidence-interval"](
                    "confidence interval for the bootstrap (between 0 and 1, default: "
                    "0.95)") |
            Opt(config.benchmarkNoAnalysis)["--benchmark-no-analysis"](
                    "perform only measurements; do not perform any analysis") |
            Opt(config.benchmarkWarmupTime, "benchmarkWarmupTime")["--benchmark-warmup-time"](
                    "amount of time in milliseconds spent on warming up each test "
                    "(default: 100)") |
            Arg(config.testsOrTags, "test name|pattern|tags")("which test or tests to use");

    return cli;
}

}  // end namespace Catch
// end catch_commandline.cpp
// start catch_common.cpp

#include <cstring>
#include <ostream>

namespace Catch {

// Two locations are equal when the line numbers match and the file names are
// either the same pointer or compare equal as C strings.
bool SourceLineInfo::operator==(SourceLineInfo const &other) const noexcept {
    if (line != other.line)
        return false;
    // Identical pointers need no string comparison.
    if (file == other.file)
        return true;
    return std::strcmp(file, other.file) == 0;
}
// Orders locations by line number first; ties are broken by comparing the
// file names as C strings.
bool SourceLineInfo::operator<(SourceLineInfo const &other) const noexcept {
    if (line != other.line)
        return line < other.line;
    // The same file will usually have the same pointer, in which case the
    // two locations are equal and strcmp does not need to be called.
    if (file == other.file)
        return false;
    return std::strcmp(file, other.file) < 0;
}

// Streams a source location as "file:line" when __GNUG__ is defined and as
// "file(line)" otherwise.
std::ostream &operator<<(std::ostream &os, SourceLineInfo const &info) {
#ifdef __GNUG__
    os << info.file << ':' << info.line;
#else
    os << info.file << '(' << info.line << ')';
#endif
    return os;
}

// Unary plus on a StreamEndStop yields an empty string.
std::string StreamEndStop::operator+() const { return std::string(); }

// Out-of-line defaulted special members of NonCopyable.
NonCopyable::NonCopyable() = default;
NonCopyable::~NonCopyable() = default;

}  // namespace Catch
// end catch_common.cpp
// start catch_config.cpp

namespace Catch {

// Copies the parsed command-line data, opens the output stream, and compiles
// the (trimmed) test/tag filters into m_testSpec.
Config::Config(ConfigData const &data) : m_data(data), m_stream(openStream()) {
    // Filter specs and section names are trimmed up front so that superfluous
    // whitespace cannot cause mismatches (esp. important for bdd macros, as
    // those are manually aligned with whitespace).
    for (auto &spec : m_data.testsOrTags)
        spec = trim(spec);
    for (auto &section : m_data.sectionsToRun)
        section = trim(section);

    TestSpecParser specParser(ITagAliasRegistry::get());
    // The filter flag is only ever raised here, never cleared.
    if (!m_data.testsOrTags.empty())
        m_hasTestFilters = true;
    for (auto const &spec : m_data.testsOrTags)
        specParser.parse(spec);
    m_testSpec = specParser.testSpec();
}

// Plain read accessors over the ConfigData copy held in m_data (plus the
// members computed by the constructor).

// Output filename as stored in the config data.
std::string const &Config::getFilename() const { return m_data.outputFilename; }

// Listing-mode flags.
bool Config::listTests() const { return m_data.listTests; }
bool Config::listTestNamesOnly() const { return m_data.listTestNamesOnly; }
bool Config::listTags() const { return m_data.listTags; }
bool Config::listReporters() const { return m_data.listReporters; }

// Note: getProcessName() returns by value, getReporterName() by reference.
std::string Config::getProcessName() const { return m_data.processName; }
std::string const &Config::getReporterName() const { return m_data.reporterName; }

// Filter specs and section names; both were trimmed by the constructor.
std::vector<std::string> const &Config::getTestsOrTags() const { return m_data.testsOrTags; }
std::vector<std::string> const &Config::getSectionsToRun() const { return m_data.sectionsToRun; }

// Test spec compiled by the constructor, and whether any filter was given.
TestSpec const &Config::testSpec() const { return m_testSpec; }
bool Config::hasTestFilters() const { return m_hasTestFilters; }

bool Config::showHelp() const { return m_data.showHelp; }

// IConfig interface
// Throwing is allowed unless the noThrow flag was set.
bool Config::allowThrows() const { return !m_data.noThrow; }
// Stream owned by m_stream, which was created by openStream().
std::ostream &Config::stream() const { return m_stream->stream(); }
// Falls back to the process name when no explicit name was configured.
std::string Config::name() const { return m_data.name.empty() ? m_data.processName : m_data.name; }
bool Config::includeSuccessfulResults() const { return m_data.showSuccessfulTests; }
// The warning accessors test individual bits of the m_data.warnings mask.
bool Config::warnAboutMissingAssertions() const {
    return !!(m_data.warnings & WarnAbout::NoAssertions);
}
bool Config::warnAboutNoTests() const { return !!(m_data.warnings & WarnAbout::NoTests); }
ShowDurations::OrNot Config::showDurations() const { return m_data.showDurations; }
double Config::minDuration() const { return m_data.minDuration; }
RunTests::InWhatOrder Config::runOrder() const { return m_data.runOrder; }
unsigned int Config::rngSeed() const { return m_data.rngSeed; }
UseColour::YesOrNo Config::useColour() const { return m_data.useColour; }
bool Config::shouldDebugBreak() const { return m_data.shouldDebugBreak; }
int Config::abortAfter() const { return m_data.abortAfter; }
bool Config::showInvisibles() const { return m_data.showInvisibles; }
Verbosity Config::verbosity() const { return m_data.verbosity; }

// Benchmarking settings.
bool Config::benchmarkNoAnalysis() const { return m_data.benchmarkNoAnalysis; }
int Config::benchmarkSamples() const { return m_data.benchmarkSamples; }
double Config::benchmarkConfidenceInterval() const { return m_data.benchmarkConfidenceInterval; }
unsigned int Config::benchmarkResamples() const { return m_data.benchmarkResamples; }
// The stored warm-up time is a plain number; it is wrapped as milliseconds here.
std::chrono::milliseconds Config::benchmarkWarmupTime() const {
    return std::chrono::milliseconds(m_data.benchmarkWarmupTime);
}

// Creates the output stream from the configured output filename via
// Catch::makeStream. Called from the constructor's initializer list.
IStream const *Config::openStream() { return Catch::makeStream(m_data.outputFilename); }

}  // end namespace Catch
// end catch_config.cpp
// start catch_console_colour.cpp

#if defined(__clang__)
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wexit-time-destructors"
#endif

// start catch_errno_guard.h

namespace Catch {

// Scope guard around errno. The constructor and destructor are defined
// elsewhere; presumably the constructor stores the current errno in
// m_oldErrno and the destructor restores it -- confirm against the
// definitions.
class ErrnoGuard {
public:
    ErrnoGuard();
    ~ErrnoGuard();

private:
    // errno value held for the lifetime of the guard.
    int m_oldErrno;
};

}  // namespace Catch

// end catch_errno_guard.h
// start catch_windows_h_proxy.h

#if defined(CATCH_PLATFORM_WINDOWS)

#if !defined(NOMINMAX) && !defined(CATCH_CONFIG_NO_NOMINMAX)
#define CATCH_DEFINED_NOMINMAX
#define NOMINMAX
#endif
#if !defined(WIN32_LEAN_AND_MEAN) && !defined(CATCH_CONFIG_NO_WIN32_LEAN_AND_MEAN)
#define CATCH_DEFINED_WIN32_LEAN_AND_MEAN
#define WIN32_LEAN_AND_MEAN
#endif

#ifdef __AFXDLL
#include <AfxWin.h>
#else
#include <windows.h>
#endif

#ifdef CATCH_DEFINED_NOMINMAX
#undef NOMINMAX
#endif
#ifdef CATCH_DEFINED_WIN32_LEAN_AND_MEAN
#undef WIN32_LEAN_AND_MEAN
#endif

#endif  // defined(CATCH_PLATFORM_WINDOWS)

// end catch_windows_h_proxy.h
#include <sstream>

namespace Catch {
namespace {

// Interface for the platform-specific console colour back ends.
struct IColourImpl {
    virtual ~IColourImpl() = default;
    // Switches the console to the given colour code.
    virtual void use(Colour::Code _colourCode) = 0;
};

// Colour back end that ignores every request; used whenever colour output
// is disabled or unavailable.
struct NoColourImpl : IColourImpl {
    // Returns the shared function-local static instance.
    static IColourImpl *instance() {
        static NoColourImpl theInstance;
        return &theInstance;
    }

    // Intentionally does nothing.
    void use(Colour::Code) override {}
};

}  // namespace
}  // namespace Catch

#if !defined(CATCH_CONFIG_COLOUR_NONE) && !defined(CATCH_CONFIG_COLOUR_WINDOWS) && \
        !defined(CATCH_CONFIG_COLOUR_ANSI)
#ifdef CATCH_PLATFORM_WINDOWS
#define CATCH_CONFIG_COLOUR_WINDOWS
#else
#define CATCH_CONFIG_COLOUR_ANSI
#endif
#endif

#if defined(CATCH_CONFIG_COLOUR_WINDOWS)  /////////////////////////////////////////

namespace Catch {
namespace {

// Colour back end that drives the Win32 console through
// SetConsoleTextAttribute. The attributes in effect at construction time are
// remembered so that Colour::None can restore the original foreground and
// every colour change keeps the original background.
class Win32ColourImpl : public IColourImpl {
public:
    Win32ColourImpl() : stdoutHandle(GetStdHandle(STD_OUTPUT_HANDLE)) {
        CONSOLE_SCREEN_BUFFER_INFO csbiInfo = {};
        if (!GetConsoleScreenBufferInfo(stdoutHandle, &csbiInfo)) {
            // The query fails when stdout is not attached to a console (for
            // example when it is redirected). Fall back to a plain white
            // foreground on a black background instead of reading an
            // uninitialised structure.
            csbiInfo.wAttributes = FOREGROUND_GREEN | FOREGROUND_RED | FOREGROUND_BLUE;
        }
        // Strip the background bits to obtain the foreground part ...
        originalForegroundAttributes =
                csbiInfo.wAttributes &
                ~(BACKGROUND_GREEN | BACKGROUND_RED | BACKGROUND_BLUE | BACKGROUND_INTENSITY);
        // ... and the foreground bits to obtain the background part.
        originalBackgroundAttributes =
                csbiInfo.wAttributes &
                ~(FOREGROUND_GREEN | FOREGROUND_RED | FOREGROUND_BLUE | FOREGROUND_INTENSITY);
    }

    // Maps a Catch colour code to Win32 foreground attribute bits and applies
    // them. Colour::Bright is a modifier, not a colour, and is reported as an
    // internal error; unknown codes are reported through CATCH_ERROR.
    void use(Colour::Code _colourCode) override {
        switch (_colourCode) {
        case Colour::None:
            return setTextAttribute(originalForegroundAttributes);
        case Colour::White:
            return setTextAttribute(FOREGROUND_GREEN | FOREGROUND_RED | FOREGROUND_BLUE);
        case Colour::Red:
            return setTextAttribute(FOREGROUND_RED);
        case Colour::Green:
            return setTextAttribute(FOREGROUND_GREEN);
        case Colour::Blue:
            return setTextAttribute(FOREGROUND_BLUE);
        case Colour::Cyan:
            return setTextAttribute(FOREGROUND_BLUE | FOREGROUND_GREEN);
        case Colour::Yellow:
            return setTextAttribute(FOREGROUND_RED | FOREGROUND_GREEN);
        case Colour::Grey:
            return setTextAttribute(0);

        case Colour::LightGrey:
            return setTextAttribute(FOREGROUND_INTENSITY);
        case Colour::BrightRed:
            return setTextAttribute(FOREGROUND_INTENSITY | FOREGROUND_RED);
        case Colour::BrightGreen:
            return setTextAttribute(FOREGROUND_INTENSITY | FOREGROUND_GREEN);
        case Colour::BrightWhite:
            return setTextAttribute(FOREGROUND_INTENSITY | FOREGROUND_GREEN | FOREGROUND_RED |
                                    FOREGROUND_BLUE);
        case Colour::BrightYellow:
            return setTextAttribute(FOREGROUND_INTENSITY | FOREGROUND_RED | FOREGROUND_GREEN);

        case Colour::Bright:
            CATCH_INTERNAL_ERROR("not a colour");

        default:
            CATCH_ERROR("Unknown colour requested");
        }
    }

private:
    // Applies the given foreground bits combined with the original background.
    void setTextAttribute(WORD _textAttribute) {
        SetConsoleTextAttribute(stdoutHandle, _textAttribute | originalBackgroundAttributes);
    }
    HANDLE stdoutHandle;
    WORD originalForegroundAttributes;
    WORD originalBackgroundAttributes;
};

// Selects the colour back end on Windows. UseColour::Auto (also used when no
// config is available) is treated as "yes"; any mode other than Yes/Auto
// yields the no-op implementation.
IColourImpl *platformColourInstance() {
    // Constructed on first call regardless of the selected mode.
    static Win32ColourImpl s_instance;

    IConfigPtr config = getCurrentContext().getConfig();
    UseColour::YesOrNo requested = UseColour::Auto;
    if (config)
        requested = config->useColour();

    bool const coloured = (requested == UseColour::Auto) || (requested == UseColour::Yes);
    if (coloured)
        return &s_instance;
    return NoColourImpl::instance();
}

}  // namespace
}  // end namespace Catch

#elif defined(CATCH_CONFIG_COLOUR_ANSI)  //////////////////////////////////////

#include <unistd.h>

namespace Catch {
namespace {

// Colour back end that emits POSIX / ANSI terminal escape sequences.
// Thanks to Adam Strzelecki for original contribution
// (http://github.com/nanoant)
// https://github.com/philsquared/Catch/pull/131
class PosixColourImpl : public IColourImpl {
public:
    // Returns the shared function-local static instance.
    static IColourImpl *instance() {
        static PosixColourImpl s_instance;
        return &s_instance;
    }

    // Looks up the escape sequence for the colour code and writes it to the
    // current config's stream. Colour::Bright is a modifier, not a colour;
    // it and any unknown code are reported as internal errors.
    void use(Colour::Code _colourCode) override {
        const char *sequence = nullptr;
        switch (_colourCode) {
        case Colour::None:
        case Colour::White:
            sequence = "[0m";
            break;
        case Colour::Red:
            sequence = "[0;31m";
            break;
        case Colour::Green:
            sequence = "[0;32m";
            break;
        case Colour::Blue:
            sequence = "[0;34m";
            break;
        case Colour::Cyan:
            sequence = "[0;36m";
            break;
        case Colour::Yellow:
            sequence = "[0;33m";
            break;
        case Colour::Grey:
            sequence = "[1;30m";
            break;

        case Colour::LightGrey:
            sequence = "[0;37m";
            break;
        case Colour::BrightRed:
            sequence = "[1;31m";
            break;
        case Colour::BrightGreen:
            sequence = "[1;32m";
            break;
        case Colour::BrightWhite:
            sequence = "[1;37m";
            break;
        case Colour::BrightYellow:
            sequence = "[1;33m";
            break;

        case Colour::Bright:
            CATCH_INTERNAL_ERROR("not a colour");
        default:
            CATCH_INTERNAL_ERROR("Unknown colour requested");
        }
        setColour(sequence);
    }

private:
    // Writes ESC followed by the given sequence to the config's stream.
    void setColour(const char *_escapeCode) {
        getCurrentContext().getConfig()->stream() << '\033' << _escapeCode;
    }
};

// Decides whether colour should be used when the mode is "auto".
// The result is assembled from preprocessor-selected terms:
//  - on Mac/iPhone, colour is suppressed while a debugger is active;
//  - colour requires stdout to be a terminal (isatty), except under DJGPP
//    in strict ANSI mode, where the function always returns false.
bool useColourOnPlatform() {
    return
#if defined(CATCH_PLATFORM_MAC) || defined(CATCH_PLATFORM_IPHONE)
            !isDebuggerActive() &&
#endif
#if !(defined(__DJGPP__) && defined(__STRICT_ANSI__))
            isatty(STDOUT_FILENO)
#else
            false
#endif
                    ;
}
// Selects the colour back end for ANSI terminals. UseColour::Auto (also used
// when no config is available) is resolved through useColourOnPlatform().
// An ErrnoGuard is held for the duration of the call.
IColourImpl *platformColourInstance() {
    ErrnoGuard guard;

    IConfigPtr config = getCurrentContext().getConfig();
    UseColour::YesOrNo requested = UseColour::Auto;
    if (config)
        requested = config->useColour();

    // The platform is only probed when the mode is still undecided.
    if (requested == UseColour::Auto)
        requested = useColourOnPlatform() ? UseColour::Yes : UseColour::No;

    if (requested == UseColour::Yes)
        return PosixColourImpl::instance();
    return NoColourImpl::instance();
}

}  // namespace
}  // end namespace Catch

#else  // not Windows or ANSI ///////////////////////////////////////////////

namespace Catch {

// Neither the Windows nor the ANSI back end is enabled: always use the
// no-op implementation.
static IColourImpl *platformColourInstance() { return NoColourImpl::instance(); }

}  // end namespace Catch

#endif  // Windows/ ANSI/ None

namespace Catch {

// Switches the console to the given colour immediately on construction.
Colour::Colour(Code _colourCode) { use(_colourCode); }
// Move construction takes over the source's moved state and marks the source
// as moved-from, so that only one of the two objects resets the colour on
// destruction.
Colour::Colour(Colour &&other) noexcept : m_moved(other.m_moved) {
    other.m_moved = true;
}
// Move assignment: adopts the source's moved state, then marks the source as
// moved-from. The statement order matters for self-assignment, which leaves
// the object marked as moved.
Colour &Colour::operator=(Colour &&other) noexcept {
    m_moved = other.m_moved;
    other.m_moved = true;
    return *this;
}

// Resets the console colour on destruction, unless this object has been
// moved from.
Colour::~Colour() {
    if (m_moved)
        return;
    use(None);
}

// Forwards the colour request to the platform back end, which is selected
// once on first use and cached in a function-local static.
void Colour::use(Code _colourCode) {
    static IColourImpl *impl = platformColourInstance();
    // Strictly speaking, a null back end cannot possibly happen.
    // However, under some conditions it does happen (see #1626),
    // and the check is small enough that we can let practicality
    // triumph over purity in this case.
    if (impl == nullptr)
        return;
    impl->use(_colourCode);
}

// Streaming a Colour writes nothing; the stream is returned unchanged.
std::ostream &operator<<(std::ostream &os, Colour const &) { return os; }

}  // end namespace Catch

#if defined(__clang__)
#pragma clang diagnostic pop
#endif

// end catch_console_colour.cpp
// start catch_context.cpp

namespace Catch {

// Concrete context object: stores the active config, runner and
// result-capture pointers and exposes them through the IContext and
// IMutableContext interfaces.
class Context : public IMutableContext, NonCopyable {
public:  // IContext
    IResultCapture *getResultCapture() override {
        return m_resultCapture;
    }

    IRunner *getRunner() override {
        return m_runner;
    }

    IConfigPtr const &getConfig() const override {
        return m_config;
    }

    ~Context() override;

public:  // IMutableContext
    void setResultCapture(IResultCapture *resultCapture) override {
        m_resultCapture = resultCapture;
    }

    void setRunner(IRunner *runner) override {
        m_runner = runner;
    }

    void setConfig(IConfigPtr const &config) override {
        m_config = config;
    }

    friend IMutableContext &getCurrentMutableContext();

private:
    IConfigPtr m_config;
    // Raw pointers, initially null; assigned through the setters above.
    IRunner *m_runner = nullptr;
    IResultCapture *m_resultCapture = nullptr;
};

// Storage for the single current context; null until createContext() runs.
IMutableContext *IMutableContext::currentContext = nullptr;

// Allocates a new Context and stores it in currentContext. Any previous
// value of currentContext is overwritten without being deleted.
void IMutableContext::createContext() { currentContext = new Context(); }

// Destroys the current context (if any) and resets the pointer to null.
void cleanUpContext() {
    delete IMutableContext::currentContext;
    IMutableContext::currentContext = nullptr;
}
// Out-of-line defaulted destructors for the context types.
IContext::~IContext() = default;
IMutableContext::~IMutableContext() = default;
Context::~Context() = default;

// Returns a reference to the shared random number generator, a
// function-local static that is default-constructed on first use.
SimplePcg32 &rng() {
    static SimplePcg32 s_rng;
    return s_rng;
}

}  // namespace Catch
// end catch_context.cpp
// start catch_debug_console.cpp

// start catch_debug_console.h

#include <string>

namespace Catch {
void writeToDebugConsole(std::string const &text);
}

// end catch_debug_console.h
// writeToDebugConsole has one definition per platform, selected below.
#if defined(CATCH_CONFIG_ANDROID_LOGWRITE)
#include <android/log.h>

namespace Catch {
// Android: write the text to the Android log at debug priority, tag "Catch".
void writeToDebugConsole(std::string const &text) {
    __android_log_write(ANDROID_LOG_DEBUG, "Catch", text.c_str());
}
}  // namespace Catch

#elif defined(CATCH_PLATFORM_WINDOWS)

namespace Catch {
// Windows: pass the text to OutputDebugStringA.
void writeToDebugConsole(std::string const &text) { ::OutputDebugStringA(text.c_str()); }
}  // namespace Catch

#else

namespace Catch {
// Everything else: write the text to Catch::cout().
void writeToDebugConsole(std::string const &text) {
    // !TBD: Need a version for Mac/ XCode and other IDEs
    Catch::cout() << text;
}
}  // namespace Catch

#endif  // Platform
// end catch_debug_console.cpp
// start catch_debugger.cpp

#if defined(CATCH_PLATFORM_MAC) || defined(CATCH_PLATFORM_IPHONE)

#include <sys/types.h>
#include <unistd.h>

#include <cassert>
#include <cstddef>
#include <ostream>

#ifdef __apple_build_version__
// These headers will only compile with AppleClang (XCode)
// For other compilers (Clang, GCC, ... ) we need to exclude them
#include <sys/sysctl.h>
#endif

namespace Catch {
#ifdef __apple_build_version__
// The following function is taken directly from the following technical note:
// https://developer.apple.com/library/archive/qa/qa1361/_index.html

// Returns true if the current process is being debugged (either
// running under the debugger or has a debugger attached post facto).
// Returns false (after printing a diagnostic to Catch's cerr) if the
// sysctl query itself fails.
bool isDebuggerActive() {
    int mib[4];
    struct kinfo_proc info;
    std::size_t size;

    // Initialize the flags so that, if sysctl fails for some bizarre
    // reason, we get a predictable result.

    info.kp_proc.p_flag = 0;

    // Initialize mib, which tells sysctl the info we want, in this case
    // we're looking for information about a specific process ID.

    mib[0] = CTL_KERN;
    mib[1] = KERN_PROC;
    mib[2] = KERN_PROC_PID;
    mib[3] = getpid();

    // Call sysctl.

    size = sizeof(info);
    if (sysctl(mib, sizeof(mib) / sizeof(*mib), &info, &size, nullptr, 0) != 0) {
        Catch::cerr() << "\n** Call to sysctl failed - unable to determine if "
                         "debugger is active **\n"
                      << std::endl;
        return false;
    }

    // We're being debugged if the P_TRACED flag is set.

    return ((info.kp_proc.p_flag & P_TRACED) != 0);
}
#else
// Fallback for compilers that do not define __apple_build_version__:
// debugger detection is not implemented, so always report "no debugger".
bool isDebuggerActive() {
    // We need to find another way to determine this for non-appleclang compilers
    // on macOS
    return false;
}
#endif
}  // namespace Catch

#elif defined(CATCH_PLATFORM_LINUX)
#include <fstream>
#include <string>

namespace Catch {
// The standard POSIX way of detecting a debugger is to attempt to
// ptrace() the process, but this needs to be done from a child and not
// this process itself to still allow attaching to this process later
// if wanted, so is rather heavy. Under Linux we have the PID of the
// "debugger" (which doesn't need to be gdb, of course, it could also
// be strace, for example) in /proc/$PID/status, so just get it from
// there instead.
//
// Returns true when the "TracerPid:" entry of /proc/self/status holds a
// non-zero PID, false when it is zero or the entry cannot be found.
bool isDebuggerActive() {
    // Libstdc++ has a bug, where std::ifstream sets errno to 0
    // This way our users can properly assert over errno values
    ErrnoGuard guard;
    std::ifstream statusFile("/proc/self/status");

    static const int PREFIX_LEN = 11;
    std::string entry;
    while (std::getline(statusFile, entry)) {
        if (entry.compare(0, PREFIX_LEN, "TracerPid:\t") != 0) {
            continue;
        }
        // We're traced if the PID is not 0 and no other PID starts
        // with 0 digit, so it's enough to check for just a single
        // character.
        return entry.length() > PREFIX_LEN && entry[PREFIX_LEN] != '0';
    }

    return false;
}
}  // namespace Catch
#elif defined(_MSC_VER) || defined(__MINGW32__)
// MSVC and MinGW use the same implementation: ask the Win32 API whether a
// debugger is attached. The function is declared by hand here rather than
// through a Windows header.
extern "C" __declspec(dllimport) int __stdcall IsDebuggerPresent();
namespace Catch {
bool isDebuggerActive() {
    return IsDebuggerPresent() != 0;
}
}  // namespace Catch
#else
namespace Catch {
// Fallback for platforms without a detection method: always reports that
// no debugger is attached.
bool isDebuggerActive() { return false; }
}  // namespace Catch
#endif  // Platform
// end catch_debugger.cpp
// start catch_decomposer.cpp

namespace Catch {

ITransientExpression::~ITransientExpression() = default;

// Streams the expression `lhs op rhs` to `os`.
// When both operands together are shorter than 40 characters and neither
// contains a newline, the three parts are separated by single spaces;
// otherwise each part goes on its own line.
void formatReconstructedExpression(std::ostream &os,
                                   std::string const &lhs,
                                   StringRef op,
                                   std::string const &rhs) {
    bool const isShort = lhs.size() + rhs.size() < 40;
    bool const isSingleLine =
            lhs.find('\n') == std::string::npos && rhs.find('\n') == std::string::npos;
    char const *separator = (isShort && isSingleLine) ? " " : "\n";
    os << lhs << separator << op << separator << rhs;
}
}  // namespace Catch
// end catch_decomposer.cpp
// start catch_enforce.cpp

#include <stdexcept>

namespace Catch {
#if defined(CATCH_CONFIG_DISABLE_EXCEPTIONS) && \
        !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS_CUSTOM_HANDLER)
[[noreturn]] void throw_exception(std::exception const &e) {
    Catch::cerr() << "Catch will terminate because it needed to throw an exception.\n"
                  << "The message was: " << e.what() << '\n';
    std::terminate();
}
#endif

[[noreturn]] void throw_logic_error(std::string const &msg) {
    throw_exception(std::logic_error(msg));
}

[[noreturn]] void throw_domain_error(std::string const &msg) {
    throw_exception(std::domain_error(msg));
}

[[noreturn]] void throw_runtime_error(std::string const &msg) {
    throw_exception(std::runtime_error(msg));
}

}  // namespace Catch
// end catch_enforce.cpp
// start catch_enum_values_registry.cpp
// start catch_enum_values_registry.h

#include <memory>
#include <vector>

namespace Catch {

namespace Detail {

// Builds an EnumInfo for `enumName` by pairing each entry of `values`
// with the corresponding name parsed out of `allValueNames`.
std::unique_ptr<EnumInfo> makeEnumInfo(StringRef enumName,
                                       StringRef allValueNames,
                                       std::vector<int> const &values);

// Registry that owns every EnumInfo created through registerEnum.
class EnumValuesRegistry : public IMutableEnumValuesRegistry {
    // Owning storage; registerEnum returns references into these objects.
    std::vector<std::unique_ptr<EnumInfo>> m_enumInfos;

    EnumInfo const &registerEnum(StringRef enumName,
                                 StringRef allEnums,
                                 std::vector<int> const &values) override;
};

// Splits a comma-separated list of enumerator spellings and strips any
// scope qualification and surrounding whitespace from each entry.
std::vector<StringRef> parseEnums(StringRef enums);

}  // namespace Detail

}  // namespace Catch

// end catch_enum_values_registry.h

#include <cassert>
#include <map>

namespace Catch {

// Out-of-line, empty destructor for the registry interface.
IMutableEnumValuesRegistry::~IMutableEnumValuesRegistry() {}

namespace Detail {

namespace {
// Extracts the actual name part of an enum instance
// In other words, it returns the Blue part of Bikeshed::Colour::Blue
StringRef extractInstanceName(StringRef enumInstance) {
    auto const length = enumInstance.size();

    // Walk backwards until the character just before the cursor is the
    // last ':' in the string (or the beginning is reached).
    auto nameStart = length;
    for (; nameStart != 0; --nameStart) {
        if (enumInstance[nameStart - 1] == ':') {
            break;
        }
    }
    return enumInstance.substr(nameStart, length - nameStart);
}
}  // namespace

// Turns a comma-separated list of (possibly qualified) enumerator
// spellings into a list of bare, trimmed enumerator names.
std::vector<StringRef> parseEnums(StringRef enums) {
    auto const rawEntries = splitStringRef(enums, ',');

    std::vector<StringRef> names;
    names.reserve(rawEntries.size());
    for (auto const &rawEntry : rawEntries) {
        StringRef const unqualified = extractInstanceName(rawEntry);
        names.push_back(trim(unqualified));
    }
    return names;
}

// Out-of-line, empty destructor.
EnumInfo::~EnumInfo() {}

// Returns the name registered for `value`; the first matching entry wins.
// Unknown values yield a fixed placeholder string.
StringRef EnumInfo::lookup(int value) const {
    for (auto entry = m_values.begin(); entry != m_values.end(); ++entry) {
        if (entry->first == value) {
            return entry->second;
        }
    }
    return "{** unexpected enum value **}"_sr;
}

// Creates an EnumInfo named `enumName` whose entries pair values[i] with
// the i-th name parsed from `allValueNames`. The two lists are expected
// to have the same length (checked by assert only).
std::unique_ptr<EnumInfo> makeEnumInfo(StringRef enumName,
                                       StringRef allValueNames,
                                       std::vector<int> const &values) {
    std::unique_ptr<EnumInfo> result(new EnumInfo);
    result->m_name = enumName;
    result->m_values.reserve(values.size());

    const auto names = Catch::Detail::parseEnums(allValueNames);
    assert(names.size() == values.size());

    for (std::size_t idx = 0; idx < values.size(); ++idx) {
        result->m_values.emplace_back(values[idx], names[idx]);
    }

    return result;
}

// Builds the EnumInfo for the given enum, stores it in the registry, and
// returns a reference to the stored object.
EnumInfo const &EnumValuesRegistry::registerEnum(StringRef enumName,
                                                 StringRef allValueNames,
                                                 std::vector<int> const &values) {
    auto info = makeEnumInfo(enumName, allValueNames, values);
    m_enumInfos.push_back(std::move(info));
    return *m_enumInfos.back();
}

}  // namespace Detail
}  // namespace Catch

// end catch_enum_values_registry.cpp
// start catch_errno_guard.cpp

#include <cerrno>

namespace Catch {
// Remembers the value errno has at construction time...
ErrnoGuard::ErrnoGuard() : m_oldErrno(errno) {}

// ...and writes that value back into errno on destruction.
ErrnoGuard::~ErrnoGuard() {
    errno = m_oldErrno;
}
}  // namespace Catch
// end catch_errno_guard.cpp
// start catch_exception_translator_registry.cpp

// start catch_exception_translator_registry.h

#include <memory>
#include <string>
#include <vector>

namespace Catch {

// Registry of user-supplied exception translators; it takes ownership of
// every translator passed to registerTranslator.
class ExceptionTranslatorRegistry : public IExceptionTranslatorRegistry {
public:
    ~ExceptionTranslatorRegistry();
    // Stores `translator`; the registry owns it from this point on.
    virtual void registerTranslator(const IExceptionTranslator *translator);
    // Produces a textual description of the exception currently in flight.
    std::string translateActiveException() const override;
    // Runs the registered translators, or rethrows the current exception
    // when none are registered.
    std::string tryTranslators() const;

private:
    std::vector<std::unique_ptr<IExceptionTranslator const>> m_translators;
};
}  // namespace Catch

// end catch_exception_translator_registry.h
#ifdef __OBJC__
#import "Foundation/Foundation.h"
#endif

namespace Catch {

// Out-of-line, empty destructor; m_translators releases the owned
// translators through its unique_ptr elements.
ExceptionTranslatorRegistry::~ExceptionTranslatorRegistry() {}

void ExceptionTranslatorRegistry::registerTranslator(const IExceptionTranslator *translator) {
    m_translators.push_back(std::unique_ptr<const IExceptionTranslator>(translator));
}

#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
// Converts the exception currently being handled into a message string.
// The registered translators get the first attempt (via tryTranslators);
// whatever they rethrow or leave untranslated is handled by the catch
// clauses below:
//  - TestFailureException is rethrown unchanged,
//  - std::exception yields what(),
//  - std::string and const char* yield their text,
//  - anything else yields "Unknown exception".
// NOTE(review): presumably only called from inside a catch handler, since
// it relies on std::current_exception() - confirm against callers.
std::string ExceptionTranslatorRegistry::translateActiveException() const {
    try {
#ifdef __OBJC__
        // In Objective-C try objective-c exceptions first
        @try {
            return tryTranslators();
        } @catch (NSException *exception) {
            return Catch::Detail::stringify([exception description]);
        }
#else
        // Compiling a mixed mode project with MSVC means that CLR
        // exceptions will be caught in (...) as well. However, these
        // do not fill-in std::current_exception and thus lead to crash
        // when attempting rethrow.
        // /EHa switch also causes structured exceptions to be caught
        // here, but they fill-in current_exception properly, so
        // at worst the output should be a little weird, instead of
        // causing a crash.
        if (std::current_exception() == nullptr) {
            return "Non C++ exception. Possibly a CLR exception.";
        }
        return tryTranslators();
#endif
    } catch (TestFailureException &) {
        // Test failures are not translated; pass them on as-is.
        std::rethrow_exception(std::current_exception());
    } catch (std::exception &ex) {
        return ex.what();
    } catch (std::string &msg) {
        return msg;
    } catch (const char *msg) {
        return msg;
    } catch (...) {
        return "Unknown exception";
    }
}

// Hands the active exception to the first registered translator, giving
// it the range of remaining translators to fall back on. With no
// translators registered the active exception is simply rethrown.
std::string ExceptionTranslatorRegistry::tryTranslators() const {
    if (!m_translators.empty()) {
        auto const remainingBegin = m_translators.begin() + 1;
        return m_translators[0]->translate(remainingBegin, m_translators.end());
    }
    std::rethrow_exception(std::current_exception());
}

#else  // ^^ Exceptions are enabled // Exceptions are disabled vv
// Exceptions-disabled build: there can be no active exception, so reaching
// this function is reported as an internal error.
std::string ExceptionTranslatorRegistry::translateActiveException() const {
    CATCH_INTERNAL_ERROR(
            "Attempted to translate active exception under "
            "CATCH_CONFIG_DISABLE_EXCEPTIONS!");
}

// Exceptions-disabled build: translators cannot be used, so reaching this
// function is reported as an internal error.
std::string ExceptionTranslatorRegistry::tryTranslators() const {
    CATCH_INTERNAL_ERROR(
            "Attempted to use exception translators under "
            "CATCH_CONFIG_DISABLE_EXCEPTIONS!");
}
#endif

}  // namespace Catch
// end catch_exception_translator_registry.cpp
// start catch_fatal_condition.cpp

#include <algorithm>

#if !defined(CATCH_CONFIG_WINDOWS_SEH) && !defined(CATCH_CONFIG_POSIX_SIGNALS)

namespace Catch {

// If neither SEH nor signal handling is required, the handler impls
// do not have to do anything, and can be empty.
// This variant is compiled only when both CATCH_CONFIG_WINDOWS_SEH and
// CATCH_CONFIG_POSIX_SIGNALS are undefined.
void FatalConditionHandler::engage_platform() {}
void FatalConditionHandler::disengage_platform() {}
FatalConditionHandler::FatalConditionHandler() = default;
FatalConditionHandler::~FatalConditionHandler() = default;

}  // end namespace Catch

#endif  // !CATCH_CONFIG_WINDOWS_SEH && !CATCH_CONFIG_POSIX_SIGNALS

#if defined(CATCH_CONFIG_WINDOWS_SEH) && defined(CATCH_CONFIG_POSIX_SIGNALS)
#error "Inconsistent configuration: Windows' SEH handling and POSIX signals cannot be enabled at the same time"
#endif  // CATCH_CONFIG_WINDOWS_SEH && CATCH_CONFIG_POSIX_SIGNALS

#if defined(CATCH_CONFIG_WINDOWS_SEH) || defined(CATCH_CONFIG_POSIX_SIGNALS)

namespace {
//! Signals fatal error message to the run context
void reportFatal(char const *const message) {
    auto *resultCapture = Catch::getCurrentContext().getResultCapture();
    resultCapture->handleFatalErrorCondition(message);
}

//! Minimal size Catch2 needs for its own fatal error handling.
//! Picked anecdotally, so it might not be sufficient on all
//! platforms, and for all configurations.
constexpr std::size_t minStackSizeForErrors = 32 * 1024;
}  // end unnamed namespace

#endif  // CATCH_CONFIG_WINDOWS_SEH || CATCH_CONFIG_POSIX_SIGNALS

#if defined(CATCH_CONFIG_WINDOWS_SEH)

namespace Catch {

// Pairs a Windows exception code with the message reported for it.
struct SignalDefs {
    DWORD id;          // exception code compared against ExceptionRecord->ExceptionCode
    const char *name;  // human-readable description passed to reportFatal
};

// There is no 1-1 mapping between signals and windows exceptions.
// Windows can easily distinguish between SO and SigSegV,
// but SigInt, SigTerm, etc are handled differently.
// Table of the exception codes that the vectored handler reports as
// fatal errors, together with the message used for each.
static SignalDefs signalDefs[] = {
        {static_cast<DWORD>(EXCEPTION_ILLEGAL_INSTRUCTION), "SIGILL - Illegal instruction signal"},
        {static_cast<DWORD>(EXCEPTION_STACK_OVERFLOW), "SIGSEGV - Stack overflow"},
        {static_cast<DWORD>(EXCEPTION_ACCESS_VIOLATION), "SIGSEGV - Segmentation violation signal"},
        {static_cast<DWORD>(EXCEPTION_INT_DIVIDE_BY_ZERO), "Divide by zero error"},
};

// Vectored exception handler: reports the exception as a fatal error when
// its code appears in signalDefs, then always lets the search continue.
static LONG CALLBACK handleVectoredException(PEXCEPTION_POINTERS ExceptionInfo) {
    for (auto const &knownException : signalDefs) {
        bool const matches =
                ExceptionInfo->ExceptionRecord->ExceptionCode == knownException.id;
        if (matches) {
            reportFatal(knownException.name);
        }
    }
    // If it's not an exception we care about, pass it along.
    // This stops us from eating debugger breaks etc.
    return EXCEPTION_CONTINUE_SEARCH;
}

// Since we do not support multiple instantiations, we put these
// into global variables and rely on cleaning them up in outlined
// constructors/destructors
// Handle returned by AddVectoredExceptionHandler; null while no handler
// is registered.
static PVOID exceptionHandlerHandle = nullptr;

// For MSVC, we reserve part of the stack memory for handling
// memory overflow structured exception.
FatalConditionHandler::FatalConditionHandler() {
    ULONG stackReserve = static_cast<ULONG>(minStackSizeForErrors);
    bool const reserved = SetThreadStackGuarantee(&stackReserve) != 0;
    if (reserved) {
        return;
    }
    // We do not want to fully error out, because needing
    // the stack reserve should be rare enough anyway.
    Catch::cerr() << "Failed to reserve piece of stack."
                  << " Stack overflows will not be reported successfully.";
}

// We do not attempt to unset the stack guarantee, because
// Windows does not support lowering the stack size guarantee.
// Hence the destructor has nothing to do.
FatalConditionHandler::~FatalConditionHandler() = default;

// Installs handleVectoredException and remembers the registration handle.
// A failed registration is raised as a runtime error.
void FatalConditionHandler::engage_platform() {
    // Register as first handler in current chain
    exceptionHandlerHandle = AddVectoredExceptionHandler(1, handleVectoredException);
    if (exceptionHandlerHandle == nullptr) {
        CATCH_RUNTIME_ERROR("Could not register vectored exception handler");
    }
}

// Unregisters the vectored handler and clears the stored handle.
// A failed unregistration is raised as a runtime error.
void FatalConditionHandler::disengage_platform() {
    bool const removed = RemoveVectoredExceptionHandler(exceptionHandlerHandle) != 0;
    if (!removed) {
        CATCH_RUNTIME_ERROR("Could not unregister vectored exception handler");
    }
    exceptionHandlerHandle = nullptr;
}

}  // end namespace Catch

#endif  // CATCH_CONFIG_WINDOWS_SEH

#if defined(CATCH_CONFIG_POSIX_SIGNALS)

#include <signal.h>

namespace Catch {

// Pairs a POSIX signal number with the message reported for it.
struct SignalDefs {
    int id;            // signal number passed to sigaction / compared in handleSignal
    const char *name;  // human-readable description passed to reportFatal
};

// Signals for which a handler is installed, with the message used when
// each one is reported. oldSigActions below is sized from this table and
// is indexed in parallel with it.
static SignalDefs signalDefs[] = {{SIGINT, "SIGINT - Terminal interrupt signal"},
                                  {SIGILL, "SIGILL - Illegal instruction signal"},
                                  {SIGFPE, "SIGFPE - Floating point error signal"},
                                  {SIGSEGV, "SIGSEGV - Segmentation violation signal"},
                                  {SIGTERM, "SIGTERM - Termination request signal"},
                                  {SIGABRT, "SIGABRT - Abort (abnormal termination) signal"}};

// Older GCCs trigger -Wmissing-field-initializers for T foo = {}
// which is zero initialization, but not explicit. We want to avoid
// that.
#if defined(__GNUC__)
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wmissing-field-initializers"
#endif

// Buffer used as the alternate signal stack; allocated in the
// FatalConditionHandler constructor and freed in its destructor.
static char *altStackMem = nullptr;
// Size of altStackMem in bytes; computed once, on first construction.
static std::size_t altStackSize = 0;
// Signal stack that was active before engage_platform() replaced it.
static stack_t oldSigStack{};
// Previous signal dispositions, one per signalDefs entry (same order).
static struct sigaction oldSigActions[sizeof(signalDefs) / sizeof(SignalDefs)]{};

// Reinstates the signal dispositions and the alternate stack that were
// saved by engage_platform().
static void restorePreviousSignalHandlers() {
    // We set signal handlers back to the previous ones. Hopefully
    // nobody overwrote them in the meantime, and doesn't expect
    // their signal handlers to live past ours given that they
    // installed them after ours..
    std::size_t slot = 0;
    for (auto const &def : signalDefs) {
        sigaction(def.id, &oldSigActions[slot], nullptr);
        ++slot;
    }
    // Return the old stack
    sigaltstack(&oldSigStack, nullptr);
}

static void handleSignal(int sig) {
    char const *name = "<unknown signal>";
    for (auto const &def : signalDefs) {
        if (sig == def.id) {
            name = def.name;
            break;
        }
    }
    // We need to restore previous signal handlers and let them do
    // their thing, so that the users can have the debugger break
    // when a signal is raised, and so on.
    restorePreviousSignalHandlers();
    reportFatal(name);
    raise(sig);
}

// Allocates the zero-initialised buffer used as the alternate signal
// stack. The size is the larger of SIGSTKSZ and minStackSizeForErrors
// and is computed only once. Only one instance may exist at a time.
FatalConditionHandler::FatalConditionHandler() {
    assert(!altStackMem && "Cannot initialize POSIX signal handler when one already exists");
    if (altStackSize == 0) {
        auto const systemStackSize = static_cast<size_t>(SIGSTKSZ);
        altStackSize = std::max(systemStackSize, minStackSizeForErrors);
    }
    altStackMem = new char[altStackSize]();
}

// Frees the alternate signal stack buffer allocated by the constructor.
FatalConditionHandler::~FatalConditionHandler() {
    delete[] altStackMem;
    // We signal that another instance can be constructed by zeroing
    // out the pointer.
    altStackMem = nullptr;
}

void FatalConditionHandler::engage_platform() {
    stack_t sigStack;
    sigStack.ss_sp = altStackMem;
    sigStack.ss_size = altStackSize;
    sigStack.ss_flags = 0;
    sigaltstack(&sigStack, &oldSigStack);
    struct sigaction sa = {};

    sa.sa_handler = handleSignal;
    sa.sa_flags = SA_ONSTACK;
    for (std::size_t i = 0; i < sizeof(signalDefs) / sizeof(SignalDefs); ++i) {
        sigaction(signalDefs[i].id, &sa, &oldSigActions[i]);
    }
}

#if defined(__GNUC__)
#pragma GCC diagnostic pop
#endif

// Undoes engage_platform() by restoring the saved handlers and stack.
void FatalConditionHandler::disengage_platform() {
    restorePreviousSignalHandlers();
}

}  // end namespace Catch

#endif  // CATCH_CONFIG_POSIX_SIGNALS
// end catch_fatal_condition.cpp
// start catch_generators.cpp

#include <limits>
#include <set>

namespace Catch {

// Out-of-line, empty destructor.
IGeneratorTracker::~IGeneratorTracker() {}

// Returns the stored message pointer.
const char *GeneratorException::what() const noexcept {
    return m_msg;
}

namespace Generators {

// Out-of-line, empty destructor.
GeneratorUntypedBase::~GeneratorUntypedBase() {}

// Forwards to the current result capture to obtain the tracker for the
// generator identified by `generatorName` and `lineInfo`.
IGeneratorTracker &acquireGeneratorTracker(StringRef generatorName,
                                           SourceLineInfo const &lineInfo) {
    auto &resultCapture = getResultCapture();
    return resultCapture.acquireGeneratorTracker(generatorName, lineInfo);
}

}  // namespace Generators
}  // namespace Catch
// end catch_generators.cpp
// start catch_interfaces_capture.cpp

namespace Catch {
// Out-of-line defaulted destructor for the interface.
IResultCapture::~IResultCapture() = default;
}
// end catch_interfaces_capture.cpp
// start catch_interfaces_config.cpp

namespace Catch {
// Out-of-line defaulted destructor for the interface.
IConfig::~IConfig() = default;
}
// end catch_interfaces_config.cpp
// start catch_interfaces_exception.cpp

namespace Catch {
// Out-of-line defaulted destructors for the exception translation interfaces.
IExceptionTranslator::~IExceptionTranslator() = default;
IExceptionTranslatorRegistry::~IExceptionTranslatorRegistry() = default;
}  // namespace Catch
// end catch_interfaces_exception.cpp
// start catch_interfaces_registry_hub.cpp

namespace Catch {
// Out-of-line defaulted destructors for the registry hub interfaces.
IRegistryHub::~IRegistryHub() = default;
IMutableRegistryHub::~IMutableRegistryHub() = default;
}  // namespace Catch
// end catch_interfaces_registry_hub.cpp
// start catch_interfaces_reporter.cpp

// start catch_reporter_listening.h

namespace Catch {

// Reporter that holds a list of listeners plus at most one "real"
// reporter and implements the full IStreamingReporter interface.
// NOTE(review): presumably each event is forwarded to all listeners and
// then to the reporter - the definitions are not visible here; confirm.
class ListeningReporter : public IStreamingReporter {
    using Reporters = std::vector<IStreamingReporterPtr>;
    Reporters m_listeners;
    IStreamingReporterPtr m_reporter = nullptr;
    ReporterPreferences m_preferences;

public:
    ListeningReporter();

    // Both take ownership of the passed-in reporter object.
    void addListener(IStreamingReporterPtr &&listener);
    void addReporter(IStreamingReporterPtr &&reporter);

public:  // IStreamingReporter
    ReporterPreferences getPreferences() const override;

    void noMatchingTestCases(std::string const &spec) override;

    void reportInvalidArguments(std::string const &arg) override;

    static std::set<Verbosity> getSupportedVerbosities();

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
    void benchmarkPreparing(std::string const &name) override;
    void benchmarkStarting(BenchmarkInfo const &benchmarkInfo) override;
    void benchmarkEnded(BenchmarkStats<> const &benchmarkStats) override;
    void benchmarkFailed(std::string const &) override;
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

    void testRunStarting(TestRunInfo const &testRunInfo) override;
    void testGroupStarting(GroupInfo const &groupInfo) override;
    void testCaseStarting(TestCaseInfo const &testInfo) override;
    void sectionStarting(SectionInfo const &sectionInfo) override;
    void assertionStarting(AssertionInfo const &assertionInfo) override;

    // The return value indicates if the messages buffer should be cleared:
    bool assertionEnded(AssertionStats const &assertionStats) override;
    void sectionEnded(SectionStats const &sectionStats) override;
    void testCaseEnded(TestCaseStats const &testCaseStats) override;
    void testGroupEnded(TestGroupStats const &testGroupStats) override;
    void testRunEnded(TestRunStats const &testRunStats) override;

    void skipTest(TestCaseInfo const &testInfo) override;
    bool isMulti() const override;
};

}  // end namespace Catch

// end catch_reporter_listening.h
namespace Catch {

// Uses the stream provided by the configuration itself as the output stream.
ReporterConfig::ReporterConfig(IConfigPtr const &_fullConfig)
        : m_stream(&_fullConfig->stream()), m_fullConfig(_fullConfig) {}

// Uses an explicitly supplied output stream instead of the config's own.
// Only the address of `_stream` is stored, so it must outlive this object.
ReporterConfig::ReporterConfig(IConfigPtr const &_fullConfig, std::ostream &_stream)
        : m_stream(&_stream), m_fullConfig(_fullConfig) {}

// Accessors for the stored stream and configuration.
std::ostream &ReporterConfig::stream() const { return *m_stream; }
IConfigPtr ReporterConfig::fullConfig() const { return m_fullConfig; }

// Stores a copy of the run's name.
TestRunInfo::TestRunInfo(std::string const &_name) : name(_name) {}

// Stores the group's name, its index, and the total number of groups
// (note the member is spelled `groupsCounts`).
GroupInfo::GroupInfo(std::string const &_name, std::size_t _groupIndex, std::size_t _groupsCount)
        : name(_name), groupIndex(_groupIndex), groupsCounts(_groupsCount) {}

// Copies the assertion result, the accompanying info messages and the
// totals. The transient expression pointer is then assigned explicitly
// from the source result, and if the result carries a message of its own,
// that message is appended to the copied info messages.
AssertionStats::AssertionStats(AssertionResult const &_assertionResult,
                               std::vector<MessageInfo> const &_infoMessages,
                               Totals const &_totals)
        : assertionResult(_assertionResult), infoMessages(_infoMessages), totals(_totals) {
    auto const &sourceExpression = _assertionResult.m_resultData.lazyExpression;
    assertionResult.m_resultData.lazyExpression.m_transientExpression =
            sourceExpression.m_transientExpression;

    if (!assertionResult.hasMessage()) {
        return;
    }

    // Copy message into messages list.
    // !TBD This should have been done earlier, somewhere
    MessageBuilder messageBuilder(assertionResult.getTestMacroName(),
                                  assertionResult.getSourceInfo(),
                                  assertionResult.getResultType());
    messageBuilder << assertionResult.getMessage();
    messageBuilder.m_info.message = messageBuilder.m_stream.str();

    infoMessages.push_back(messageBuilder.m_info);
}

AssertionStats::~AssertionStats() = default;

// Plain aggregate-style constructor: copies every argument into the
// member of the same name.
SectionStats::SectionStats(SectionInfo const &_sectionInfo,
                           Counts const &_assertions,
                           double _durationInSeconds,
                           bool _missingAssertions)
        : sectionInfo(_sectionInfo),
          assertions(_assertions),
          durationInSeconds(_durationInSeconds),
          missingAssertions(_missingAssertions) {}

// Out-of-line defaulted destructor.
SectionStats::~SectionStats() = default;

// Plain aggregate-style constructor: copies every argument into the
// member of the same name.
TestCaseStats::TestCaseStats(TestCaseInfo const &_testInfo,
                             Totals const &_totals,
                             std::string const &_stdOut,
                             std::string const &_stdErr,
                             bool _aborting)
        : testInfo(_testInfo),
          totals(_totals),
          stdOut(_stdOut),
          stdErr(_stdErr),
          aborting(_aborting) {}

// Out-of-line defaulted destructor.
TestCaseStats::~TestCaseStats() = default;

// Full constructor: copies the group info, totals and aborting flag.
TestGroupStats::TestGroupStats(GroupInfo const &_groupInfo, Totals const &_totals, bool _aborting)
        : groupInfo(_groupInfo), totals(_totals), aborting(_aborting) {}

// Group-info-only constructor: `totals` is left default-initialised and
// `aborting` is set to false.
TestGroupStats::TestGroupStats(GroupInfo const &_groupInfo)
        : groupInfo(_groupInfo), aborting(false) {}

// Out-of-line defaulted destructor.
TestGroupStats::~TestGroupStats() = default;

// Copies the run info, totals and aborting flag into the matching members.
TestRunStats::TestRunStats(TestRunInfo const &_runInfo, Totals const &_totals, bool _aborting)
        : runInfo(_runInfo), totals(_totals), aborting(_aborting) {}

// Out-of-line defaulted destructor.
TestRunStats::~TestRunStats() = default;

// Default implementations: fatal errors are ignored, and a reporter is
// not a "multi" reporter unless it overrides isMulti().
void IStreamingReporter::fatalErrorEncountered(StringRef) {}
bool IStreamingReporter::isMulti() const { return false; }

// Out-of-line defaulted destructors for the reporter factory/registry interfaces.
IReporterFactory::~IReporterFactory() = default;
IReporterRegistry::~IReporterRegistry() = default;

}  // end namespace Catch
// end catch_interfaces_reporter.cpp
// start catch_interfaces_runner.cpp

namespace Catch {
// Out-of-line defaulted destructor for the interface.
IRunner::~IRunner() = default;
}
// end catch_interfaces_runner.cpp
// start catch_interfaces_testcase.cpp

namespace Catch {
// Out-of-line defaulted destructors for the test case interfaces.
ITestInvoker::~ITestInvoker() = default;
ITestCaseRegistry::~ITestCaseRegistry() = default;
}  // namespace Catch
// end catch_interfaces_testcase.cpp
// start catch_leak_detector.cpp

#ifdef CATCH_CONFIG_WINDOWS_CRTDBG
#include <crtdbg.h>

namespace Catch {

// Enables the MSVC debug CRT's allocation tracking and leak check flags,
// and routes CRT warnings to stderr and the debugger output.
LeakDetector::LeakDetector() {
    int const currentFlags = _CrtSetDbgFlag(_CRTDBG_REPORT_FLAG);
    _CrtSetDbgFlag(currentFlags | _CRTDBG_LEAK_CHECK_DF | _CRTDBG_ALLOC_MEM_DF);

    _CrtSetReportMode(_CRT_WARN, _CRTDBG_MODE_FILE | _CRTDBG_MODE_DEBUG);
    _CrtSetReportFile(_CRT_WARN, _CRTDBG_FILE_STDERR);

    // Change this to leaking allocation's number to break there
    _CrtSetBreakAlloc(-1);
}
}  // namespace Catch

#else

// Without CATCH_CONFIG_WINDOWS_CRTDBG there is nothing to set up.
Catch::LeakDetector::LeakDetector() {}

#endif

// Calls Catch::cleanUp() on destruction, in every configuration.
Catch::LeakDetector::~LeakDetector() { Catch::cleanUp(); }
// end catch_leak_detector.cpp
// start catch_list.cpp

// start catch_list.h

#include <set>

namespace Catch {

// Prints the matching test cases; returns how many were listed.
std::size_t listTests(Config const &config);

// Prints only the names of the matching test cases; returns how many.
std::size_t listTestsNamesOnly(Config const &config);

// Usage count and the set of distinct spellings collected for one tag.
struct TagInfo {
    // Records one more use of the tag, remembering this spelling.
    void add(std::string const &spelling);
    // Returns all spellings concatenated, each wrapped in [brackets].
    std::string all() const;

    std::set<std::string> spellings;
    std::size_t count = 0;
};

// Prints the tags of the matching test cases; returns the number of tags.
std::size_t listTags(Config const &config);

// Prints the registered reporters; returns how many there are.
std::size_t listReporters();

// Runs every listing requested by `config`. The result is empty when no
// listing was requested, otherwise the sum of the listed counts.
Option<std::size_t> list(std::shared_ptr<Config> const &config);

}  // end namespace Catch

// end catch_list.h
// start catch_text.h

namespace Catch {
// Makes the clara::TextFlow names (e.g. Column) usable unqualified
// inside namespace Catch.
using namespace clara::TextFlow;
}

// end catch_text.h
#include <algorithm>
#include <iomanip>
#include <limits>

namespace Catch {

// Prints every test case selected by the config's test spec: name, and
// in high verbosity also source location and description, followed by
// the tags when there are any. Ends with a summary line and returns the
// number of test cases printed.
std::size_t listTests(Config const &config) {
    TestSpec const &testSpec = config.testSpec();
    bool const filtered = config.hasTestFilters();

    Catch::cout() << (filtered ? "Matching test cases:\n" : "All available test cases:\n");

    auto matchedTestCases = filterTests(getAllTestCasesSorted(config), testSpec, config);
    for (auto const &testCaseInfo : matchedTestCases) {
        // Hidden tests are printed in the secondary text colour.
        Colour colourGuard(testCaseInfo.isHidden() ? Colour::SecondaryText : Colour::None);

        Catch::cout() << Column(testCaseInfo.name).initialIndent(2).indent(4) << "\n";

        if (config.verbosity() >= Verbosity::High) {
            auto const location = Catch::Detail::stringify(testCaseInfo.lineInfo);
            Catch::cout() << Column(location).indent(4) << std::endl;

            std::string const description = testCaseInfo.description.empty()
                                                    ? "(NO DESCRIPTION)"
                                                    : testCaseInfo.description;
            Catch::cout() << Column(description).indent(4) << std::endl;
        }

        if (!testCaseInfo.tags.empty()) {
            Catch::cout() << Column(testCaseInfo.tagsAsString()).indent(6) << "\n";
        }
    }

    char const *summaryLabel = filtered ? "matching test case" : "test case";
    Catch::cout() << pluralise(matchedTestCases.size(), summaryLabel) << '\n' << std::endl;
    return matchedTestCases.size();
}

// Prints one line per selected test case containing just its name (quoted
// when the name starts with '#'), plus the source location in high
// verbosity. Returns the number of names printed.
std::size_t listTestsNamesOnly(Config const &config) {
    TestSpec const &testSpec = config.testSpec();
    std::vector<TestCase> matchedTestCases =
            filterTests(getAllTestCasesSorted(config), testSpec, config);

    std::size_t printed = 0;
    for (auto const &testCaseInfo : matchedTestCases) {
        ++printed;

        bool const needsQuotes = startsWith(testCaseInfo.name, '#');
        if (needsQuotes) {
            Catch::cout() << '"' << testCaseInfo.name << '"';
        } else {
            Catch::cout() << testCaseInfo.name;
        }

        if (config.verbosity() >= Verbosity::High) {
            Catch::cout() << "\t@" << testCaseInfo.lineInfo;
        }
        Catch::cout() << std::endl;
    }
    return printed;
}

// Counts one more use of the tag and records the spelling it was used
// with (duplicate spellings collapse, since `spellings` is a set).
void TagInfo::add(std::string const &spelling) {
    count += 1;
    spellings.insert(spelling);
}

std::string TagInfo::all() const {
    size_t size = 0;
    for (auto const &spelling : spellings) {
        // Add 2 for the brackes
        size += spelling.size() + 2;
    }

    std::string out;
    out.reserve(size);
    for (auto const &spelling : spellings) {
        out += '[';
        out += spelling;
        out += ']';
    }
    return out;
}

// Collects the tags of all selected test cases (grouped case-insensitively)
// and prints each group with its usage count and all of its spellings.
// Returns the number of distinct (lower-cased) tags.
std::size_t listTags(Config const &config) {
    TestSpec const &testSpec = config.testSpec();
    Catch::cout() << (config.hasTestFilters() ? "Tags for matching test cases:\n"
                                              : "All available tags:\n");

    // Keyed by the lower-cased tag name.
    std::map<std::string, TagInfo> tagCounts;

    std::vector<TestCase> matchedTestCases =
            filterTests(getAllTestCasesSorted(config), testSpec, config);
    for (auto const &testCase : matchedTestCases) {
        for (auto const &tagName : testCase.getTestCaseInfo().tags) {
            // operator[] creates an empty TagInfo the first time a tag is seen.
            tagCounts[toLower(tagName)].add(tagName);
        }
    }

    for (auto const &entry : tagCounts) {
        TagInfo const &info = entry.second;

        ReusableStringStream rss;
        rss << "  " << std::setw(2) << info.count << "  ";
        auto const countPrefix = rss.str();

        // Wrapped spellings are indented to line up after the count prefix.
        auto spellingsColumn = Column(info.all())
                                       .initialIndent(0)
                                       .indent(countPrefix.size())
                                       .width(CATCH_CONFIG_CONSOLE_WIDTH - 10);
        Catch::cout() << countPrefix << spellingsColumn << '\n';
    }
    Catch::cout() << pluralise(tagCounts.size(), "tag") << '\n' << std::endl;
    return tagCounts.size();
}

std::size_t listReporters() {
    Catch::cout() << "Available reporters:\n";
    IReporterRegistry::FactoryMap const &factories =
            getRegistryHub().getReporterRegistry().getFactories();
    std::size_t maxNameLen = 0;
    for (auto const &factoryKvp : factories)
        maxNameLen = (std::max)(maxNameLen, factoryKvp.first.size());

    for (auto const &factoryKvp : factories) {
        Catch::cout() << Column(factoryKvp.first + ":").indent(2).width(5 + maxNameLen) +
                                 Column(factoryKvp.second->getDescription())
                                         .initialIndent(0)
                                         .indent(2)
                                         .width(CATCH_CONFIG_CONSOLE_WIDTH - maxNameLen - 8)
                      << "\n";
    }
    Catch::cout() << std::endl;
    return factories.size();
}

// Installs `config` as the current config and runs each listing it asks
// for (tests, test names, tags, reporters - in that order). The returned
// option stays empty when nothing was requested; otherwise it holds the
// sum of the counts returned by the individual listings.
Option<std::size_t> list(std::shared_ptr<Config> const &config) {
    Option<std::size_t> listedCount;
    auto const accumulate = [&listedCount](std::size_t listed) {
        listedCount = listedCount.valueOr(0) + listed;
    };

    getCurrentMutableContext().setConfig(config);
    if (config->listTests()) {
        accumulate(listTests(*config));
    }
    if (config->listTestNamesOnly()) {
        accumulate(listTestsNamesOnly(*config));
    }
    if (config->listTags()) {
        accumulate(listTags(*config));
    }
    if (config->listReporters()) {
        accumulate(listReporters());
    }
    return listedCount;
}

}  // end namespace Catch
// end catch_list.cpp
// start catch_matchers.cpp

namespace Catch {
namespace Matchers {
namespace Impl {

// Returns the matcher description, computing it through describe() only
// while the cached string is still empty.
std::string MatcherUntypedBase::toString() const {
    if (!m_cachedToString.empty()) {
        return m_cachedToString;
    }
    m_cachedToString = describe();
    return m_cachedToString;
}

MatcherUntypedBase::~MatcherUntypedBase() = default;

}  // namespace Impl
}  // namespace Matchers

using namespace Matchers;
using Matchers::Impl::MatcherBase;

}  // namespace Catch
// end catch_matchers.cpp
// start catch_matchers_exception.cpp

namespace Catch {
namespace Matchers {
namespace Exception {

// Matches when the exception's what() text is exactly the stored message.
bool ExceptionMessageMatcher::match(std::exception const &ex) const {
    return m_message == ex.what();
}

// Describes the expectation, quoting the stored message.
std::string ExceptionMessageMatcher::describe() const {
    std::string text = "exception message matches \"";
    text += m_message;
    text += "\"";
    return text;
}

}  // namespace Exception
// Builds a matcher that compares an exception's what() text with `message`.
Exception::ExceptionMessageMatcher Message(std::string const &message) {
    Exception::ExceptionMessageMatcher matcher(message);
    return matcher;
}

// namespace Exception
}  // namespace Matchers
}  // namespace Catch
// end catch_matchers_exception.cpp
// start catch_matchers_floating.cpp

// start catch_polyfills.hpp

namespace Catch {
bool isnan(float f);
bool isnan(double d);
}  // namespace Catch

// end catch_polyfills.hpp
// start catch_to_string.hpp

#include <string>

namespace Catch {
template <typename T>
std::string to_string(T const &t) {
#if defined(CATCH_CONFIG_CPP11_TO_STRING)
    return std::to_string(t);
#else
    ReusableStringStream rss;
    rss << t;
    return rss.str();
#endif
}
}  // end namespace Catch

// end catch_to_string.hpp
#include <algorithm>
#include <cmath>
#include <cstdint>
#include <cstdlib>
#include <cstring>
#include <iomanip>
#include <limits>
#include <sstream>
#include <type_traits>

namespace Catch {
namespace {

// Copies the object representation of a float into a signed 32-bit integer.
int32_t convert(float f) {
    static_assert(sizeof(float) == sizeof(int32_t), "Important ULP matcher assumption violated");
    int32_t bits;
    // The static_assert above guarantees both sizes are equal.
    std::memcpy(&bits, &f, sizeof(bits));
    return bits;
}

// Copies the object representation of a double into a signed 64-bit integer.
int64_t convert(double d) {
    static_assert(sizeof(double) == sizeof(int64_t), "Important ULP matcher assumption violated");
    int64_t bits;
    // The static_assert above guarantees both sizes are equal.
    std::memcpy(&bits, &d, sizeof(bits));
    return bits;
}

// Reports whether lhs and rhs are at most maxUlpDiff apart, measured as the
// difference of their integer bit patterns.
template <typename FP>
bool almostEqualUlps(FP lhs, FP rhs, uint64_t maxUlpDiff) {
    // Any comparison involving NaN is false, so rule it out first.
    if (Catch::isnan(lhs) || Catch::isnan(rhs)) {
        return false;
    }

    auto const lhsBits = convert(lhs);
    auto const rhsBits = convert(rhs);

    bool const lhsNegative = lhsBits < 0;
    bool const rhsNegative = rhsBits < 0;
    if (lhsNegative != rhsNegative) {
        // Opposite sign bits can still compare equal for +0 and -0.
        return lhs == rhs;
    }

    // The static_cast is a workaround for IBM XLC.
    auto const distance = std::abs(static_cast<FP>(lhsBits - rhsBits));
    return static_cast<uint64_t>(distance) <= maxUlpDiff;
}

#if defined(CATCH_CONFIG_GLOBAL_NEXTAFTER)

// Forwards to the global C function for float arguments.
float nextafter(float x, float y) {
    return ::nextafterf(x, y);
}

// Forwards to the global C function for double arguments.
double nextafter(double x, double y) {
    return ::nextafter(x, y);
}

#endif  // ^^^ CATCH_CONFIG_GLOBAL_NEXTAFTER ^^^

// Moves `start` towards `direction` by `steps` representable values and
// returns the value reached.
template <typename FP>
FP step(FP start, FP direction, uint64_t steps) {
    FP current = start;
    uint64_t remaining = steps;
    while (remaining != 0) {
#if defined(CATCH_CONFIG_GLOBAL_NEXTAFTER)
        current = Catch::nextafter(current, direction);
#else
        current = std::nextafter(current, direction);
#endif
        --remaining;
    }
    return current;
}

// Equivalent to std::fabs(lhs - rhs) <= margin, but written without the
// subtraction so that INFINITY operands can be compared.
bool marginComparison(double lhs, double rhs, double margin) {
    // Written as !(a >= b) rather than a < b so a NaN operand still yields false.
    if (!(lhs + margin >= rhs)) {
        return false;
    }
    return rhs + margin >= lhs;
}

// Streams `num` in scientific notation with max_digits10 - 1 digits after
// the decimal point.
template <typename FloatingPoint>
void write(std::ostream &out, FloatingPoint num) {
    constexpr int fractionDigits = std::numeric_limits<FloatingPoint>::max_digits10 - 1;
    out << std::scientific;
    out << std::setprecision(fractionDigits);
    out << num;
}

}  // end anonymous namespace

namespace Matchers {
namespace Floating {

// Selects whether a ULP matcher compares and prints its operands as float
// or as double.
enum class FloatingPointKind : uint8_t { Float, Double };

// Stores the target and absolute margin; CATCH_ENFORCE rejects a margin
// that is not >= 0.
WithinAbsMatcher::WithinAbsMatcher(double target, double margin)
        : m_target(target), m_margin(margin) {
    CATCH_ENFORCE(margin >= 0,
                  "Invalid margin: " << margin << '.' << " Margin has to be non-negative.");
}

// Equivalent to std::fabs(matchee - m_target) <= m_margin, but written
// without the subtraction so that INFINITY operands can be compared.
bool WithinAbsMatcher::match(double const &matchee) const {
    bool const notTooLow = matchee + m_margin >= m_target;
    bool const notTooHigh = m_target + m_margin >= matchee;
    return notTooLow && notTooHigh;
}

// Produces "is within <margin> of <target>" using Catch's stringification.
std::string WithinAbsMatcher::describe() const {
    std::string text = "is within ";
    text += ::Catch::Detail::stringify(m_margin);
    text += " of ";
    text += ::Catch::Detail::stringify(m_target);
    return text;
}

// Stores target, ULP budget and comparison width. For a float comparison
// the budget must be below the maximum uint32_t value.
WithinUlpsMatcher::WithinUlpsMatcher(double target, uint64_t ulps, FloatingPointKind baseType)
        : m_target(target), m_ulps(ulps), m_type(baseType) {
    CATCH_ENFORCE(
            m_type == FloatingPointKind::Double || m_ulps < (std::numeric_limits<uint32_t>::max)(),
            "Provided ULP is impossibly large for a float comparison.");
}

#if defined(__clang__)
#pragma clang diagnostic push
// Clang <3.5 reports on the default branch in the switch below
#pragma clang diagnostic ignored "-Wunreachable-code"
#endif

// Compares matchee against the stored target within m_ulps ULPs, in the
// floating-point width selected by m_type. Any other m_type value raises an
// internal error.
bool WithinUlpsMatcher::match(double const &matchee) const {
    switch (m_type) {
    case FloatingPointKind::Float:
        // Both operands are narrowed to float before the ULP comparison.
        return almostEqualUlps<float>(static_cast<float>(matchee), static_cast<float>(m_target),
                                      m_ulps);
    case FloatingPointKind::Double:
        return almostEqualUlps<double>(matchee, m_target, m_ulps);
    default:
        CATCH_INTERNAL_ERROR("Unknown FloatingPointKind value");
    }
}

#if defined(__clang__)
#pragma clang diagnostic pop
#endif

// Describes the matcher as "is within N ULPs of <target> ([<low>, <high>])",
// where the bounds are the values m_ulps steps below and above the target
// in the selected floating-point width.
std::string WithinUlpsMatcher::describe() const {
    std::stringstream ret;

    ret << "is within " << m_ulps << " ULPs of ";

    if (m_type == FloatingPointKind::Float) {
        write(ret, static_cast<float>(m_target));
        ret << 'f';
    } else {
        write(ret, m_target);
    }

    ret << " ([";
    if (m_type == FloatingPointKind::Double) {
        auto const lowerBound = step(m_target, static_cast<double>(-INFINITY), m_ulps);
        auto const upperBound = step(m_target, static_cast<double>(INFINITY), m_ulps);
        write(ret, lowerBound);
        ret << ", ";
        write(ret, upperBound);
    } else {
        // We have to cast INFINITY to float because of MinGW, see #1782
        auto const narrowTarget = static_cast<float>(m_target);
        auto const lowerBound = step(narrowTarget, static_cast<float>(-INFINITY), m_ulps);
        auto const upperBound = step(narrowTarget, static_cast<float>(INFINITY), m_ulps);
        write(ret, lowerBound);
        ret << ", ";
        write(ret, upperBound);
    }
    ret << "])";

    return ret.str();
}

WithinRelMatcher::WithinRelMatcher(double target, double epsilon)
        : m_target(target), m_epsilon(epsilon) {
    CATCH_ENFORCE(m_epsilon >= 0., "Relative comparison with epsilon <  0 does not make sense.");
    CATCH_ENFORCE(m_epsilon < 1., "Relative comparison with epsilon >= 1 does not make sense.");
}

// Matches when matchee and the target differ by at most m_epsilon times the
// larger of their magnitudes. An infinite margin is replaced by zero.
bool WithinRelMatcher::match(double const &matchee) const {
    auto const largerMagnitude = (std::max)(std::fabs(matchee), std::fabs(m_target));
    auto const relMargin = m_epsilon * largerMagnitude;
    double effectiveMargin = relMargin;
    if (std::isinf(relMargin)) {
        effectiveMargin = 0;
    }
    return marginComparison(matchee, m_target, effectiveMargin);
}

std::string WithinRelMatcher::describe() const {
    Catch::ReusableStringStream sstr;
    sstr << "and " << m_target << " are within " << m_epsilon * 100. << "% of each other";
    return sstr.str();
}

}  // namespace Floating

// ULP matcher for a double target; the comparison is done in double width.
Floating::WithinUlpsMatcher WithinULP(double target, uint64_t maxUlpDiff) {
    auto const kind = Floating::FloatingPointKind::Double;
    return Floating::WithinUlpsMatcher(target, maxUlpDiff, kind);
}

// ULP matcher for a float target; the comparison is done in float width.
Floating::WithinUlpsMatcher WithinULP(float target, uint64_t maxUlpDiff) {
    auto const kind = Floating::FloatingPointKind::Float;
    return Floating::WithinUlpsMatcher(target, maxUlpDiff, kind);
}

// Builds a matcher accepting values within the absolute `margin` of `target`.
Floating::WithinAbsMatcher WithinAbs(double target, double margin) {
    Floating::WithinAbsMatcher matcher(target, margin);
    return matcher;
}

// Relative matcher for a double target with an explicit tolerance.
Floating::WithinRelMatcher WithinRel(double target, double eps) {
    Floating::WithinRelMatcher matcher(target, eps);
    return matcher;
}

// Relative matcher for a double target; tolerance is 100 * double epsilon.
Floating::WithinRelMatcher WithinRel(double target) {
    auto const defaultEps = std::numeric_limits<double>::epsilon() * 100;
    return Floating::WithinRelMatcher(target, defaultEps);
}

// Relative matcher for a float target with an explicit tolerance.
Floating::WithinRelMatcher WithinRel(float target, float eps) {
    Floating::WithinRelMatcher matcher(target, eps);
    return matcher;
}

// Relative matcher for a float target; tolerance is 100 * float epsilon.
Floating::WithinRelMatcher WithinRel(float target) {
    auto const defaultEps = std::numeric_limits<float>::epsilon() * 100;
    return Floating::WithinRelMatcher(target, defaultEps);
}

}  // namespace Matchers
}  // namespace Catch
// end catch_matchers_floating.cpp
// start catch_matchers_generic.cpp

// Wraps a user-supplied predicate description for reporting; an empty
// description yields a generic placeholder.
std::string Catch::Matchers::Generic::Detail::finalizeDescription(const std::string &desc) {
    if (!desc.empty()) {
        return "matches predicate: \"" + desc + '"';
    }
    return "matches undescribed predicate";
}
// end catch_matchers_generic.cpp
// start catch_matchers_string.cpp

#include <regex>

namespace Catch {
namespace Matchers {

namespace StdString {

// Stores the case-sensitivity choice and the comparison string adjusted for it.
CasedString::CasedString(std::string const &str, CaseSensitive::Choice caseSensitivity)
        : m_caseSensitivity(caseSensitivity), m_str(adjustString(str)) {}

// Lower-cases the input for case-insensitive comparison; otherwise returns
// it unchanged.
std::string CasedString::adjustString(std::string const &str) const {
    if (m_caseSensitivity == CaseSensitive::No) {
        return toLower(str);
    }
    return str;
}

// Suffix appended to descriptions of case-insensitive matchers; empty for
// case-sensitive ones.
std::string CasedString::caseSensitivitySuffix() const {
    if (m_caseSensitivity == CaseSensitive::No) {
        return " (case insensitive)";
    }
    return std::string();
}

// Stores the comparator and the operation name used in describe().
StringMatcherBase::StringMatcherBase(std::string const &operation, CasedString const &comparator)
        : m_comparator(comparator), m_operation(operation) {}

// Builds `<operation>: "<string>"<suffix>`, reserving the final length up front.
std::string StringMatcherBase::describe() const {
    auto const suffix = m_comparator.caseSensitivitySuffix();

    std::string description;
    // 5 extra characters: ": ", two quotes and one spare.
    description.reserve(5 + m_operation.size() + m_comparator.m_str.size() + suffix.size());
    description.append(m_operation)
            .append(": \"")
            .append(m_comparator.m_str)
            .append("\"")
            .append(suffix);
    return description;
}

EqualsMatcher::EqualsMatcher(CasedString const &comparator)
        : StringMatcherBase("equals", comparator) {}

// Matches when the case-adjusted source equals the comparator string.
bool EqualsMatcher::match(std::string const &source) const {
    auto const adjusted = m_comparator.adjustString(source);
    return adjusted == m_comparator.m_str;
}

ContainsMatcher::ContainsMatcher(CasedString const &comparator)
        : StringMatcherBase("contains", comparator) {}

// Matches when the case-adjusted source contains the comparator string.
bool ContainsMatcher::match(std::string const &source) const {
    auto const adjusted = m_comparator.adjustString(source);
    return contains(adjusted, m_comparator.m_str);
}

StartsWithMatcher::StartsWithMatcher(CasedString const &comparator)
        : StringMatcherBase("starts with", comparator) {}

// Matches when the case-adjusted source starts with the comparator string.
bool StartsWithMatcher::match(std::string const &source) const {
    auto const adjusted = m_comparator.adjustString(source);
    return startsWith(adjusted, m_comparator.m_str);
}

EndsWithMatcher::EndsWithMatcher(CasedString const &comparator)
        : StringMatcherBase("ends with", comparator) {}

// Matches when the case-adjusted source ends with the comparator string.
bool EndsWithMatcher::match(std::string const &source) const {
    auto const adjusted = m_comparator.adjustString(source);
    return endsWith(adjusted, m_comparator.m_str);
}

RegexMatcher::RegexMatcher(std::string regex, CaseSensitive::Choice caseSensitivity)
        : m_regex(std::move(regex)), m_caseSensitivity(caseSensitivity) {}

// Compiles the stored pattern on every call and reports whether the whole
// of `matchee` matches it.
bool RegexMatcher::match(std::string const &matchee) const {
    // ECMAScript is the default syntax option anyway
    std::regex::flag_type flags = std::regex::ECMAScript;
    if (m_caseSensitivity == CaseSensitive::Choice::No) {
        flags |= std::regex::icase;
    }
    std::regex const compiled(m_regex, flags);
    return std::regex_match(matchee, compiled);
}

// Produces "matches <pattern> case sensitively" or "... case insensitively".
std::string RegexMatcher::describe() const {
    std::string text = "matches " + ::Catch::Detail::stringify(m_regex);
    if (m_caseSensitivity == CaseSensitive::Choice::Yes) {
        text += " case sensitively";
    } else {
        text += " case insensitively";
    }
    return text;
}

}  // namespace StdString

// Factory functions for the string matchers. Each literal-string matcher
// wraps its argument in a CasedString carrying the case-sensitivity choice.
StdString::EqualsMatcher Equals(std::string const &str, CaseSensitive::Choice caseSensitivity) {
    StdString::CasedString const comparator(str, caseSensitivity);
    return StdString::EqualsMatcher(comparator);
}
StdString::ContainsMatcher Contains(std::string const &str, CaseSensitive::Choice caseSensitivity) {
    StdString::CasedString const comparator(str, caseSensitivity);
    return StdString::ContainsMatcher(comparator);
}
StdString::EndsWithMatcher EndsWith(std::string const &str, CaseSensitive::Choice caseSensitivity) {
    StdString::CasedString const comparator(str, caseSensitivity);
    return StdString::EndsWithMatcher(comparator);
}
StdString::StartsWithMatcher StartsWith(std::string const &str,
                                        CaseSensitive::Choice caseSensitivity) {
    StdString::CasedString const comparator(str, caseSensitivity);
    return StdString::StartsWithMatcher(comparator);
}

// The regex matcher takes the pattern text directly.
StdString::RegexMatcher Matches(std::string const &regex, CaseSensitive::Choice caseSensitivity) {
    return StdString::RegexMatcher(regex, caseSensitivity);
}

}  // namespace Matchers
}  // namespace Catch
// end catch_matchers_string.cpp
// start catch_message.cpp

// start catch_uncaught_exceptions.h

namespace Catch {
bool uncaught_exceptions();
}  // end namespace Catch

// end catch_uncaught_exceptions.h
#include <cassert>
#include <stack>

namespace Catch {

// Records where a message came from and assigns it the next value of the
// global sequence counter.
MessageInfo::MessageInfo(StringRef const &_macroName,
                         SourceLineInfo const &_lineInfo,
                         ResultWas::OfType _type)
        : macroName(_macroName), lineInfo(_lineInfo), type(_type), sequence(++globalCount) {}

// Messages are identified and ordered purely by their sequence number.
bool MessageInfo::operator==(MessageInfo const &other) const {
    return other.sequence == sequence;
}

bool MessageInfo::operator<(MessageInfo const &other) const {
    return other.sequence > sequence;
}

// This may need protecting if threading support is added
unsigned int MessageInfo::globalCount = 0;

////////////////////////////////////////////////////////////////////////////

Catch::MessageBuilder::MessageBuilder(StringRef const &macroName,
                                      SourceLineInfo const &lineInfo,
                                      ResultWas::OfType type)
        : m_info(macroName, lineInfo, type) {}

////////////////////////////////////////////////////////////////////////////

// Takes the builder's info, fills in the streamed text and pushes the
// message onto the current result capture.
ScopedMessage::ScopedMessage(MessageBuilder const &builder) : m_info(builder.m_info), m_moved() {
    m_info.message = builder.m_stream.str();
    auto &capture = getResultCapture();
    capture.pushScopedMessage(m_info);
}

// Move constructor: takes over the message from `old` and marks `old` as
// moved-from so its destructor does not pop the message.
// The info is moved rather than copied; `old.m_info` is not read again
// because ~ScopedMessage skips popScopedMessage when m_moved is set.
ScopedMessage::ScopedMessage(ScopedMessage &&old) : m_info(std::move(old.m_info)), m_moved() {
    old.m_moved = true;
}

// Pops the message again unless an exception is in flight or this object
// was moved from.
ScopedMessage::~ScopedMessage() {
    if (uncaught_exceptions() || m_moved) {
        return;
    }
    getResultCapture().popScopedMessage(m_info);
}

// Splits the stringified argument list `names` into individual expressions
// and creates one message per expression, pre-filled with "<expr> := ".
// Commas inside (), [] or {} and inside quoted literals do not split.
Capturer::Capturer(StringRef macroName,
                   SourceLineInfo const &lineInfo,
                   ResultWas::OfType resultType,
                   StringRef names) {
    // Returns names[start..end] with leading/trailing commas and whitespace removed.
    auto trimmed = [&](size_t start, size_t end) {
        while (names[start] == ',' || isspace(static_cast<unsigned char>(names[start]))) {
            ++start;
        }
        while (names[end] == ',' || isspace(static_cast<unsigned char>(names[end]))) {
            --end;
        }
        return names.substr(start, end - start + 1);
    };
    // Returns the index of the quote closing the literal opened at `start`,
    // stepping over backslash-escaped characters.
    auto skipq = [&](size_t start, char quote) {
        for (auto i = start + 1; i < names.size(); ++i) {
            if (names[i] == quote)
                return i;
            if (names[i] == '\\')
                ++i;
        }
        CATCH_INTERNAL_ERROR("CAPTURE parsing encountered unmatched quote");
    };

    // `start` marks the beginning of the expression currently being scanned.
    size_t start = 0;
    // Currently open brackets; a comma only splits when this is empty.
    std::stack<char> openings;
    for (size_t pos = 0; pos < names.size(); ++pos) {
        char c = names[pos];
        switch (c) {
        case '[':
        case '{':
        case '(':
            // It is basically impossible to disambiguate between
            // comparison and start of template args in this context
            //            case '<':
            openings.push(c);
            break;
        case ']':
        case '}':
        case ')':
            //           case '>':
            // NOTE(review): pop() assumes a matching opener was pushed earlier.
            openings.pop();
            break;
        case '"':
        case '\'':
            // Jump to the closing quote so its contents are not interpreted.
            pos = skipq(pos, c);
            break;
        case ',':
            if (start != pos && openings.empty()) {
                m_messages.emplace_back(macroName, lineInfo, resultType);
                m_messages.back().message = static_cast<std::string>(trimmed(start, pos));
                m_messages.back().message += " := ";
                start = pos;
            }
        }
    }
    assert(openings.empty() && "Mismatched openings");
    // The final expression has no trailing comma, so it is emitted here.
    m_messages.emplace_back(macroName, lineInfo, resultType);
    m_messages.back().message = static_cast<std::string>(trimmed(start, names.size() - 1));
    m_messages.back().message += " := ";
}
// Pops every captured message again unless an exception is in flight.
Capturer::~Capturer() {
    if (uncaught_exceptions()) {
        return;
    }
    assert(m_captured == m_messages.size());
    size_t index = 0;
    while (index < m_captured) {
        m_resultCapture.popScopedMessage(m_messages[index]);
        ++index;
    }
}

// Appends the stringified value to the message at `index`, pushes that
// message onto the result capture and counts it as captured.
void Capturer::captureValue(size_t index, std::string const &value) {
    assert(index < m_messages.size());
    auto &target = m_messages[index];
    target.message += value;
    m_resultCapture.pushScopedMessage(target);
    ++m_captured;
}

}  // end namespace Catch
// end catch_message.cpp
// start catch_output_redirect.cpp

// start catch_output_redirect.h
#ifndef TWOBLUECUBES_CATCH_OUTPUT_REDIRECT_H
#define TWOBLUECUBES_CATCH_OUTPUT_REDIRECT_H

#include <cstdio>
#include <iosfwd>
#include <string>

namespace Catch {

// Scoped redirection of one std::ostream: while the object is alive the
// original stream writes into the redirection stream's buffer; the
// previous buffer is restored on destruction.
class RedirectedStream {
    std::ostream &m_originalStream;
    std::ostream &m_redirectionStream;
    // Buffer the original stream had before redirection.
    std::streambuf *m_prevBuf;

public:
    RedirectedStream(std::ostream &originalStream, std::ostream &redirectionStream);
    ~RedirectedStream();
};

// Redirects Catch::cout() into an internal string stream for its lifetime.
class RedirectedStdOut {
    // Declared before m_cout: the redirection is constructed from m_rss.get().
    ReusableStringStream m_rss;
    RedirectedStream m_cout;

public:
    RedirectedStdOut();
    // Returns the text captured so far.
    auto str() const -> std::string;
};

// StdErr has two constituent streams in C++, std::cerr and std::clog
// This means that we need to redirect 2 streams into 1 to keep proper
// order of writes
class RedirectedStdErr {
    // Declared before the redirections: both are constructed from m_rss.get().
    ReusableStringStream m_rss;
    RedirectedStream m_cerr;
    RedirectedStream m_clog;

public:
    RedirectedStdErr();
    // Returns the text captured so far from both streams.
    auto str() const -> std::string;
};

// Captures Catch's cout and cerr/clog output for its lifetime and appends
// the captured text to the caller-supplied strings on destruction.
// Non-copyable and non-movable.
class RedirectedStreams {
public:
    RedirectedStreams(RedirectedStreams const &) = delete;
    RedirectedStreams &operator=(RedirectedStreams const &) = delete;
    RedirectedStreams(RedirectedStreams &&) = delete;
    RedirectedStreams &operator=(RedirectedStreams &&) = delete;

    RedirectedStreams(std::string &redirectedCout, std::string &redirectedCerr);
    ~RedirectedStreams();

private:
    // Destination strings owned by the caller; appended to in the destructor.
    std::string &m_redirectedCout;
    std::string &m_redirectedCerr;
    RedirectedStdOut m_redirectedStdOut;
    RedirectedStdErr m_redirectedStdErr;
};

#if defined(CATCH_CONFIG_NEW_CAPTURE)

// Windows's implementation of std::tmpfile is terrible (it tries
// to create a file inside system folder, thus requiring elevated
// privileges for the binary), so we have to use tmpnam(_s) and
// create the file ourselves there.
//
// Owns one temporary file for the lifetime of the object.
// Non-copyable and non-movable.
class TempFile {
public:
    TempFile(TempFile const &) = delete;
    TempFile &operator=(TempFile const &) = delete;
    TempFile(TempFile &&) = delete;
    TempFile &operator=(TempFile &&) = delete;

    TempFile();
    ~TempFile();

    // Returns the underlying FILE handle.
    std::FILE *getFile();
    // Rewinds the file and returns everything written to it.
    std::string getContents();

private:
    std::FILE *m_file = nullptr;
#if defined(_MSC_VER)
    // Name of the manually created temp file, needed to remove it later.
    char m_buffer[L_tmpnam] = {0};
#endif
};

// Redirects file descriptors 1 and 2 into temporary files for its lifetime;
// on destruction the descriptors are restored and the file contents are
// appended to the caller-supplied strings. Non-copyable and non-movable.
class OutputRedirect {
public:
    OutputRedirect(OutputRedirect const &) = delete;
    OutputRedirect &operator=(OutputRedirect const &) = delete;
    OutputRedirect(OutputRedirect &&) = delete;
    OutputRedirect &operator=(OutputRedirect &&) = delete;

    OutputRedirect(std::string &stdout_dest, std::string &stderr_dest);
    ~OutputRedirect();

private:
    // Duplicates of the original descriptors 1 and 2, used to restore them.
    int m_originalStdout = -1;
    int m_originalStderr = -1;
    TempFile m_stdoutFile;
    TempFile m_stderrFile;
    // Destination strings owned by the caller.
    std::string &m_stdoutDest;
    std::string &m_stderrDest;
};

#endif

}  // end namespace Catch

#endif  // TWOBLUECUBES_CATCH_OUTPUT_REDIRECT_H
// end catch_output_redirect.h
#include <cstdio>
#include <cstring>
#include <fstream>
#include <sstream>
#include <stdexcept>

#if defined(CATCH_CONFIG_NEW_CAPTURE)
#if defined(_MSC_VER)
#include <io.h>  //_dup and _dup2
#define dup _dup
#define dup2 _dup2
#define fileno _fileno
#else
#include <unistd.h>  // dup and dup2
#endif
#endif

namespace Catch {

// Points the original stream at the redirection stream's buffer and keeps
// the buffer it replaces (rdbuf(sb) returns the previous buffer).
RedirectedStream::RedirectedStream(std::ostream &originalStream, std::ostream &redirectionStream)
        : m_originalStream(originalStream),
          m_redirectionStream(redirectionStream),
          m_prevBuf(originalStream.rdbuf(redirectionStream.rdbuf())) {}

// Restores the buffer the original stream had before redirection.
RedirectedStream::~RedirectedStream() {
    m_originalStream.rdbuf(m_prevBuf);
}

// Redirects Catch::cout() into the internal string stream.
RedirectedStdOut::RedirectedStdOut() : m_cout(Catch::cout(), m_rss.get()) {}

auto RedirectedStdOut::str() const -> std::string {
    return m_rss.str();
}

// Redirects both Catch::cerr() and Catch::clog() into one string stream.
RedirectedStdErr::RedirectedStdErr()
        : m_cerr(Catch::cerr(), m_rss.get()), m_clog(Catch::clog(), m_rss.get()) {}

auto RedirectedStdErr::str() const -> std::string {
    return m_rss.str();
}

// Remembers the destination strings; the member redirections start
// capturing as soon as they are default-constructed.
RedirectedStreams::RedirectedStreams(std::string &redirectedCout, std::string &redirectedCerr)
        : m_redirectedCout(redirectedCout), m_redirectedCerr(redirectedCerr) {}

// Appends everything captured to the destination strings.
RedirectedStreams::~RedirectedStreams() {
    m_redirectedCout.append(m_redirectedStdOut.str());
    m_redirectedCerr.append(m_redirectedStdErr.str());
}

#if defined(CATCH_CONFIG_NEW_CAPTURE)

#if defined(_MSC_VER)
// MSVC variant: obtains a temp file name with tmpnam_s and opens it in "w+"
// mode; raises a runtime error when either step fails.
TempFile::TempFile() {
    if (tmpnam_s(m_buffer)) {
        CATCH_RUNTIME_ERROR("Could not get a temp filename");
    }
    if (fopen_s(&m_file, m_buffer, "w+")) {
        // Translate errno into text for the error message.
        char buffer[100];
        if (strerror_s(buffer, errno)) {
            CATCH_RUNTIME_ERROR("Could not translate errno to a string");
        }
        CATCH_RUNTIME_ERROR("Could not open the temp file: '" << m_buffer
                                                              << "' because: " << buffer);
    }
}
#else
// Non-MSVC variant: creates the file with std::tmpfile and raises a
// runtime error when that fails.
TempFile::TempFile() : m_file(std::tmpfile()) {
    if (m_file == nullptr) {
        CATCH_RUNTIME_ERROR("Could not create a temp file.");
    }
}

#endif

// Closes the temporary file; under MSVC the manually created file is also
// removed by name afterwards.
TempFile::~TempFile() {
    // TBD: What to do about errors here?
    std::fclose(m_file);
    // We manually create the file on Windows only, on Linux
    // it will be autodeleted
#if defined(_MSC_VER)
    std::remove(m_buffer);
#endif
}

FILE *TempFile::getFile() {
    return m_file;
}

// Rewinds the file and returns its contents, read in chunks of up to 99
// characters via fgets.
std::string TempFile::getContents() {
    std::stringstream contents;
    char chunk[100] = {};
    std::rewind(m_file);
    for (;;) {
        if (std::fgets(chunk, sizeof(chunk), m_file) == nullptr) {
            break;
        }
        contents << chunk;
    }
    return contents.str();
}

// Saves duplicates of descriptors 1 and 2, then points both descriptors at
// the temporary capture files.
OutputRedirect::OutputRedirect(std::string &stdout_dest, std::string &stderr_dest)
        : m_originalStdout(dup(1)),
          m_originalStderr(dup(2)),
          m_stdoutDest(stdout_dest),
          m_stderrDest(stderr_dest) {
    int const stdoutCaptureFd = fileno(m_stdoutFile.getFile());
    dup2(stdoutCaptureFd, 1);
    int const stderrCaptureFd = fileno(m_stderrFile.getFile());
    dup2(stderrCaptureFd, 2);
}

// Flushes all pending output into the capture files, restores the original
// descriptors 1 and 2, releases the saved duplicates, and appends the
// captured text to the destination strings.
OutputRedirect::~OutputRedirect() {
    Catch::cout() << std::flush;
    fflush(stdout);
    // Since we support overriding these streams, we flush cerr
    // even though std::cerr is unbuffered
    Catch::cerr() << std::flush;
    Catch::clog() << std::flush;
    fflush(stderr);

    dup2(m_originalStdout, 1);
    dup2(m_originalStderr, 2);

    // The duplicates created by dup() in the constructor are separate
    // descriptors; close them once 1 and 2 are restored so that each
    // OutputRedirect does not leak two descriptors.
#if defined(_MSC_VER)
    if (m_originalStdout >= 0) {
        ::_close(m_originalStdout);
    }
    if (m_originalStderr >= 0) {
        ::_close(m_originalStderr);
    }
#else
    if (m_originalStdout >= 0) {
        ::close(m_originalStdout);
    }
    if (m_originalStderr >= 0) {
        ::close(m_originalStderr);
    }
#endif

    m_stdoutDest += m_stdoutFile.getContents();
    m_stderrDest += m_stderrFile.getContents();
}

#endif  // CATCH_CONFIG_NEW_CAPTURE

}  // namespace Catch

#if defined(CATCH_CONFIG_NEW_CAPTURE)
#if defined(_MSC_VER)
#undef dup
#undef dup2
#undef fileno
#endif
#endif
// end catch_output_redirect.cpp
// start catch_polyfills.cpp

#include <cmath>

namespace Catch {

// Catch::isnan forwards to std::isnan unless CATCH_CONFIG_POLYFILL_ISNAN is
// defined, in which case std::_isnan is used instead.
#if !defined(CATCH_CONFIG_POLYFILL_ISNAN)
bool isnan(float f) { return std::isnan(f); }
bool isnan(double d) { return std::isnan(d); }
#else
// For now we only use this for embarcadero
bool isnan(float f) { return std::_isnan(f); }
bool isnan(double d) { return std::_isnan(d); }
#endif

}  // end namespace Catch
// end catch_polyfills.cpp
// start catch_random_number_generator.cpp

namespace Catch {

namespace {

#if defined(_MSC_VER)
#pragma warning(push)
#pragma warning(disable : 4146)  // we negate uint32 during the rotate
#endif
// Safe rotr implementation thanks to John Regehr
// Rotates `val` right by `count` bits; the count is reduced modulo 32, so
// neither shift amount ever reaches the width of the type.
uint32_t rotate_right(uint32_t val, uint32_t count) {
    uint32_t const shift = count & 31u;
    uint32_t const complement = (32u - shift) & 31u;
    return (val >> shift) | (val << complement);
}

#if defined(_MSC_VER)
#pragma warning(pop)
#endif

}  // namespace

SimplePcg32::SimplePcg32(result_type seed_) {
    seed(seed_);
}

// Resets the state to zero, advances once, mixes the seed into the state
// and advances once more. The order of these four steps is significant.
void SimplePcg32::seed(result_type seed_) {
    m_state = 0;
    this->operator()();
    m_state += seed_;
    this->operator()();
}

// Advances the generator by `skip` outputs, discarding each one.
void SimplePcg32::discard(uint64_t skip) {
    // We could implement this to run in O(log n) steps, but this
    // should suffice for our use case.
    uint64_t remaining = skip;
    while (remaining > 0) {
        static_cast<void>((*this)());
        --remaining;
    }
}

// Produces the next output from the current state and advances the state.
SimplePcg32::result_type SimplePcg32::operator()() {
    // The output is derived from the state as it was before advancing.
    auto const previous = m_state;

    // advance state
    m_state = previous * 6364136223846793005ULL + s_inc;

    // prepare the output value
    uint32_t const xorshifted = static_cast<uint32_t>(((previous >> 18u) ^ previous) >> 27u);
    return rotate_right(xorshifted, previous >> 59u);
}

// Two generators compare equal exactly when their states are equal.
bool operator==(SimplePcg32 const &lhs, SimplePcg32 const &rhs) {
    return !(lhs.m_state != rhs.m_state);
}

bool operator!=(SimplePcg32 const &lhs, SimplePcg32 const &rhs) {
    return !(lhs.m_state == rhs.m_state);
}
}  // namespace Catch
// end catch_random_number_generator.cpp
// start catch_registry_hub.cpp

// start catch_test_case_registry_impl.h

#include <algorithm>
#include <ios>
#include <set>
#include <vector>

namespace Catch {

class TestCase;
struct IConfig;

std::vector<TestCase> sortTests(IConfig const &config,
                                std::vector<TestCase> const &unsortedTestCases);

bool isThrowSafe(TestCase const &testCase, IConfig const &config);
bool matchTest(TestCase const &testCase, TestSpec const &testSpec, IConfig const &config);

void enforceNoDuplicateTestCases(std::vector<TestCase> const &functions);

std::vector<TestCase> filterTests(std::vector<TestCase> const &testCases,
                                  TestSpec const &testSpec,
                                  IConfig const &config);
std::vector<TestCase> const &getAllTestCasesSorted(IConfig const &config);

// ITestCaseRegistry implementation that stores registered test cases and
// caches a sorted copy of them.
class TestRegistry : public ITestCaseRegistry {
public:
    virtual ~TestRegistry() = default;

    virtual void registerTest(TestCase const &testCase);

    std::vector<TestCase> const &getAllTests() const override;
    std::vector<TestCase> const &getAllTestsSorted(IConfig const &config) const override;

private:
    std::vector<TestCase> m_functions;
    // Mutable sort cache, modifiable from the const accessors.
    mutable RunTests::InWhatOrder m_currentSortOrder = RunTests::InDeclarationOrder;
    mutable std::vector<TestCase> m_sortedFunctions;
    std::size_t m_unnamedCount = 0;
    std::ios_base::Init m_ostreamInit;  // Forces cout/ cerr to be initialised
};

///////////////////////////////////////////////////////////////////////////

// ITestInvoker that wraps a plain `void()` function pointer.
class TestInvokerAsFunction : public ITestInvoker {
    void (*m_testAsFunction)();

public:
    TestInvokerAsFunction(void (*testAsFunction)()) noexcept;

    void invoke() const override;
};

std::string extractClassName(StringRef const &classOrQualifiedMethodName);

///////////////////////////////////////////////////////////////////////////

}  // end namespace Catch

// end catch_test_case_registry_impl.h
// start catch_reporter_registry.h

#include <map>

namespace Catch {

// IReporterRegistry implementation holding reporter factories by name and
// a list of listener factories.
class ReporterRegistry : public IReporterRegistry {
public:
    ~ReporterRegistry() override;

    // Creates the reporter registered under `name`.
    IStreamingReporterPtr create(std::string const &name, IConfigPtr const &config) const override;

    void registerReporter(std::string const &name, IReporterFactoryPtr const &factory);
    void registerListener(IReporterFactoryPtr const &factory);

    FactoryMap const &getFactories() const override;
    Listeners const &getListeners() const override;

private:
    FactoryMap m_factories;
    Listeners m_listeners;
};
}  // namespace Catch

// end catch_reporter_registry.h
// start catch_tag_alias_registry.h

// start catch_tag_alias.h

#include <string>

namespace Catch {

// A tag string together with the source location passed at construction.
struct TagAlias {
    TagAlias(std::string const &_tag, SourceLineInfo _lineInfo);

    std::string tag;
    SourceLineInfo lineInfo;
};

}  // end namespace Catch

// end catch_tag_alias.h
#include <map>

namespace Catch {

// ITagAliasRegistry implementation backed by a map from alias name to TagAlias.
class TagAliasRegistry : public ITagAliasRegistry {
public:
    ~TagAliasRegistry() override;
    TagAlias const *find(std::string const &alias) const override;
    std::string expandAliases(std::string const &unexpandedTestSpec) const override;
    void add(std::string const &alias, std::string const &tag, SourceLineInfo const &lineInfo);

private:
    std::map<std::string, TagAlias> m_registry;
};

}  // end namespace Catch

// end catch_tag_alias_registry.h
// start catch_startup_exception_registry.h

#include <exception>
#include <vector>

namespace Catch {

// Collects exception_ptr objects added during startup. The class is empty
// when CATCH_CONFIG_DISABLE_EXCEPTIONS is defined.
class StartupExceptionRegistry {
#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
public:
    void add(std::exception_ptr const &exception) noexcept;
    std::vector<std::exception_ptr> const &getExceptions() const noexcept;

private:
    std::vector<std::exception_ptr> m_exceptions;
#endif
};

}  // end namespace Catch

// end catch_startup_exception_registry.h
// start catch_singletons.hpp

namespace Catch {

// Common base giving every singleton a virtual destructor, so instances
// can be handled through ISingleton pointers.
struct ISingleton {
    virtual ~ISingleton();
};

// Registers a singleton instance; Singleton::getInternal calls this for
// each instance it creates.
void addSingleton(ISingleton *singleton);
// Called from cleanUp().
void cleanupSingletons();

// Lazily created singleton wrapper around SingletonImplT. The instance is
// allocated on first access and registered through addSingleton; it is
// exposed read-only as InterfaceT and mutably as MutableInterfaceT.
template <typename SingletonImplT,
          typename InterfaceT = SingletonImplT,
          typename MutableInterfaceT = InterfaceT>
class Singleton : SingletonImplT, public ISingleton {
    // Returns the single instance, creating and registering it on first use.
    static Singleton *getInternal() {
        static Singleton *s_instance = nullptr;
        if (s_instance == nullptr) {
            s_instance = new Singleton;
            addSingleton(s_instance);
        }
        return s_instance;
    }

public:
    static InterfaceT const &get() {
        return *getInternal();
    }
    static MutableInterfaceT &getMutable() {
        return *getInternal();
    }
};

}  // namespace Catch

// end catch_singletons.hpp
namespace Catch {

namespace {

// Aggregates all of Catch's registries behind the read-only IRegistryHub
// and the mutating IMutableRegistryHub interfaces. Every method forwards
// to the corresponding member registry.
class RegistryHub : public IRegistryHub, public IMutableRegistryHub, private NonCopyable {
public:  // IRegistryHub
    RegistryHub() = default;
    IReporterRegistry const &getReporterRegistry() const override { return m_reporterRegistry; }
    ITestCaseRegistry const &getTestCaseRegistry() const override { return m_testCaseRegistry; }
    IExceptionTranslatorRegistry const &getExceptionTranslatorRegistry() const override {
        return m_exceptionTranslatorRegistry;
    }
    ITagAliasRegistry const &getTagAliasRegistry() const override { return m_tagAliasRegistry; }
    StartupExceptionRegistry const &getStartupExceptionRegistry() const override {
        return m_exceptionRegistry;
    }

public:  // IMutableRegistryHub
    void registerReporter(std::string const &name, IReporterFactoryPtr const &factory) override {
        m_reporterRegistry.registerReporter(name, factory);
    }
    void registerListener(IReporterFactoryPtr const &factory) override {
        m_reporterRegistry.registerListener(factory);
    }
    void registerTest(TestCase const &testInfo) override {
        m_testCaseRegistry.registerTest(testInfo);
    }
    void registerTranslator(const IExceptionTranslator *translator) override {
        m_exceptionTranslatorRegistry.registerTranslator(translator);
    }
    void registerTagAlias(std::string const &alias,
                          std::string const &tag,
                          SourceLineInfo const &lineInfo) override {
        m_tagAliasRegistry.add(alias, tag, lineInfo);
    }
    // Stores the currently active exception; with exceptions disabled this
    // is an internal error instead.
    void registerStartupException() noexcept override {
#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
        m_exceptionRegistry.add(std::current_exception());
#else
        CATCH_INTERNAL_ERROR(
                "Attempted to register active exception under "
                "CATCH_CONFIG_DISABLE_EXCEPTIONS!");
#endif
    }
    IMutableEnumValuesRegistry &getMutableEnumValuesRegistry() override {
        return m_enumValuesRegistry;
    }

private:
    // Members are constructed in declaration order.
    TestRegistry m_testCaseRegistry;
    ReporterRegistry m_reporterRegistry;
    ExceptionTranslatorRegistry m_exceptionTranslatorRegistry;
    TagAliasRegistry m_tagAliasRegistry;
    StartupExceptionRegistry m_exceptionRegistry;
    Detail::EnumValuesRegistry m_enumValuesRegistry;
};
}  // namespace

using RegistryHubSingleton = Singleton<RegistryHub, IRegistryHub, IMutableRegistryHub>;

// Returns the read-only view of the process-wide registry hub singleton.
IRegistryHub const &getRegistryHub() {
    IRegistryHub const &hub = RegistryHubSingleton::get();
    return hub;
}
// Returns the mutable view of the process-wide registry hub singleton.
IMutableRegistryHub &getMutableRegistryHub() {
    IMutableRegistryHub &hub = RegistryHubSingleton::getMutable();
    return hub;
}
// Releases global framework state: the registered singletons are cleaned up
// first, then the current context.
void cleanUp() {
    cleanupSingletons();
    cleanUpContext();
}
// Produces a message for the exception currently being handled by delegating
// to the exception translator registry of the global registry hub.
std::string translateActiveException() {
    auto const &translators = getRegistryHub().getExceptionTranslatorRegistry();
    return translators.translateActiveException();
}

}  // end namespace Catch
// end catch_registry_hub.cpp
// start catch_reporter_registry.cpp

namespace Catch {

// Out-of-line defaulted destructor.
ReporterRegistry::~ReporterRegistry() = default;

// Instantiates the reporter registered under `name` for the given config.
// Returns a null pointer when no factory with that name has been registered.
IStreamingReporterPtr ReporterRegistry::create(std::string const &name,
                                               IConfigPtr const &config) const {
    auto const factoryIt = m_factories.find(name);
    if (factoryIt != m_factories.end()) {
        return factoryIt->second->create(ReporterConfig(config));
    }
    return nullptr;
}

// Stores `factory` in the factory map under `name`.
// NOTE(review): if m_factories is a std::map, emplace keeps an already
// registered factory of the same name rather than replacing it -- confirm.
void ReporterRegistry::registerReporter(std::string const &name,
                                        IReporterFactoryPtr const &factory) {
    m_factories.emplace(name, factory);
}
// Appends a listener factory to the list of registered listeners.
void ReporterRegistry::registerListener(IReporterFactoryPtr const &factory) {
    m_listeners.push_back(factory);
}

// Read-only access to all registered reporter factories.
IReporterRegistry::FactoryMap const &ReporterRegistry::getFactories() const { return m_factories; }
// Read-only access to all registered listener factories.
IReporterRegistry::Listeners const &ReporterRegistry::getListeners() const { return m_listeners; }

}  // namespace Catch
// end catch_reporter_registry.cpp
// start catch_result_type.cpp

namespace Catch {

// A result counts as OK when its failure bit is not set.
bool isOk(ResultWas::OfType resultType) {
    auto const failureBits = resultType & ResultWas::FailureBit;
    return failureBits == 0;
}
// True only when `flags` is exactly the Info result value.
bool isJustInfo(int flags) {
    return ResultWas::Info == flags;
}

// Bitwise-or for disposition flags; the combination is computed on the
// underlying integers and converted back to the flag type.
ResultDisposition::Flags operator|(ResultDisposition::Flags lhs, ResultDisposition::Flags rhs) {
    int const combined = static_cast<int>(lhs) | static_cast<int>(rhs);
    return static_cast<ResultDisposition::Flags>(combined);
}

// Tests whether the ContinueOnFailure bit is set in `flags`.
bool shouldContinueOnFailure(int flags) {
    int const masked = flags & ResultDisposition::ContinueOnFailure;
    return masked != 0;
}
// Tests whether the SuppressFail bit is set in `flags`.
bool shouldSuppressFailure(int flags) {
    int const masked = flags & ResultDisposition::SuppressFail;
    return masked != 0;
}

}  // end namespace Catch
// end catch_result_type.cpp
// start catch_run_context.cpp

#include <algorithm>
#include <cassert>
#include <sstream>

namespace Catch {

namespace Generators {
// Tracker node for a generator. It combines the generic tracker behaviour of
// TrackerBase with the IGeneratorTracker interface and holds the generator
// that was attached to it via setGenerator().
struct GeneratorTracker : TestCaseTracking::TrackerBase, IGeneratorTracker {
    // The attached generator; empty until setGenerator() has been called.
    GeneratorBasePtr m_generator;

    GeneratorTracker(TestCaseTracking::NameAndLocation const &nameAndLocation,
                     TrackerContext &ctx,
                     ITracker *parent)
            : TrackerBase(nameAndLocation, ctx, parent) {}
    ~GeneratorTracker();

    // Finds the tracker for `nameAndLocation` relative to the context's
    // current tracker, or creates it as a new child of the current tracker.
    // The tracker is opened unless it is already complete.
    static GeneratorTracker &acquire(TrackerContext &ctx,
                                     TestCaseTracking::NameAndLocation const &nameAndLocation) {
        std::shared_ptr<GeneratorTracker> tracker;

        ITracker &currentTracker = ctx.currentTracker();
        // Under specific circumstances, the generator we want
        // to acquire is also the current tracker. If this is
        // the case, we have to avoid looking through current
        // tracker's children, and instead return the current
        // tracker.
        // A case where this check is important is e.g.
        //     for (int i = 0; i < 5; ++i) {
        //         int n = GENERATE(1, 2);
        //     }
        //
        // without it, the code above creates 5 nested generators.
        if (currentTracker.nameAndLocation() == nameAndLocation) {
            // Look the current tracker up through its parent to obtain the
            // owning shared pointer.
            auto thisTracker = currentTracker.parent().findChild(nameAndLocation);
            assert(thisTracker);
            assert(thisTracker->isGeneratorTracker());
            tracker = std::static_pointer_cast<GeneratorTracker>(thisTracker);
        } else if (TestCaseTracking::ITrackerPtr childTracker =
                           currentTracker.findChild(nameAndLocation)) {
            // An existing child of the current tracker matches.
            assert(childTracker);
            assert(childTracker->isGeneratorTracker());
            tracker = std::static_pointer_cast<GeneratorTracker>(childTracker);
        } else {
            // First encounter: create the tracker and attach it as a child.
            tracker = std::make_shared<GeneratorTracker>(nameAndLocation, ctx, &currentTracker);
            currentTracker.addChild(tracker);
        }

        if (!tracker->isComplete()) {
            tracker->open();
        }

        return *tracker;
    }

    // TrackerBase interface
    bool isGeneratorTracker() const override { return true; }
    auto hasGenerator() const -> bool override { return !!m_generator; }
    // Closes the tracker, then decides whether it has to be re-run: either
    // because it is still waiting for a child section to start, or because
    // it completed successfully and the generator has another value.
    void close() override {
        TrackerBase::close();
        // If a generator has a child (it is followed by a section)
        // and none of its children have started, then we must wait
        // until later to start consuming its values.
        // This catches cases where `GENERATE` is placed between two
        // `SECTION`s.
        // **The check for m_children.empty cannot be removed**.
        // doing so would break `GENERATE` _not_ followed by `SECTION`s.
        const bool should_wait_for_child = [&]() {
            // No children -> nobody to wait for
            if (m_children.empty()) {
                return false;
            }
            // If at least one child started executing, don't wait
            if (std::find_if(m_children.begin(), m_children.end(),
                             [](TestCaseTracking::ITrackerPtr tracker) {
                                 return tracker->hasStarted();
                             }) != m_children.end()) {
                return false;
            }

            // No children have started. We need to check if they _can_
            // start, and thus we should wait for them, or they cannot
            // start (due to filters), and we shouldn't wait for them
            auto *parent = m_parent;
            // This is safe: there is always at least one section
            // tracker in a test case tracking tree
            while (!parent->isSectionTracker()) {
                parent = &(parent->parent());
            }
            // NOTE(review): `parent` has already been dereferenced by the
            // loop above, so this assert cannot catch a null parent.
            assert(parent && "Missing root (test case) level section");

            auto const &parentSection = static_cast<SectionTracker &>(*parent);
            auto const &filters = parentSection.getFilters();
            // No filters -> no restrictions on running sections
            if (filters.empty()) {
                return true;
            }

            // Wait only if at least one child section is named by a filter.
            for (auto const &child : m_children) {
                if (child->isSectionTracker() &&
                    std::find(filters.begin(), filters.end(),
                              static_cast<SectionTracker &>(*child).trimmedName()) !=
                            filters.end()) {
                    return true;
                }
            }
            return false;
        }();

        // This check is a bit tricky, because m_generator->next()
        // has a side-effect, where it consumes generator's current
        // value, but we do not want to invoke the side-effect if
        // this generator is still waiting for any child to start.
        if (should_wait_for_child || (m_runState == CompletedSuccessfully && m_generator->next())) {
            // Drop the children and mark the tracker as executing again.
            m_children.clear();
            m_runState = Executing;
        }
    }

    // IGeneratorTracker interface
    auto getGenerator() const -> GeneratorBasePtr const & override { return m_generator; }
    void setGenerator(GeneratorBasePtr &&generator) override { m_generator = std::move(generator); }
};
// Out-of-line definition of the destructor declared in the struct; it has no
// work of its own to do.
GeneratorTracker::~GeneratorTracker() {}
}  // namespace Generators

// Sets up a run: takes ownership of the reporter, installs this object into
// the current mutable context as runner and result capture, publishes the
// config there, and finally notifies the reporter that the run is starting.
RunContext::RunContext(IConfigPtr const &_config, IStreamingReporterPtr &&reporter)
        : m_runInfo(_config->name()),
          m_context(getCurrentMutableContext()),
          m_config(_config),
          m_reporter(std::move(reporter)),
          // Placeholder assertion info: no macro name, empty file with line 0.
          m_lastAssertionInfo{StringRef(), SourceLineInfo("", 0), StringRef(),
                              ResultDisposition::Normal},
          // Passing assertions are reported if either the config or the
          // reporter's preferences ask for them.
          m_includeSuccessfulResults(m_config->includeSuccessfulResults() ||
                                     m_reporter->getPreferences().shouldReportAllAssertions) {
    m_context.setRunner(this);
    m_context.setConfig(m_config);
    m_context.setResultCapture(this);
    m_reporter->testRunStarting(m_runInfo);
}

// Tells the reporter that the run has ended, passing the accumulated totals
// and whether the run was aborting.
RunContext::~RunContext() {
    TestRunStats const runStats(m_runInfo, m_totals, aborting());
    m_reporter->testRunEnded(runStats);
}

void RunContext::testGroupStarting(std::string const &testSpec,
                                   std::size_t groupIndex,
                                   std::size_t groupsCount) {
    m_reporter->testGroupStarting(GroupInfo(testSpec, groupIndex, groupsCount));
}

void RunContext::testGroupEnded(std::string const &testSpec,
                                Totals const &totals,
                                std::size_t groupIndex,
                                std::size_t groupsCount) {
    m_reporter->testGroupEnded(
            TestGroupStats(GroupInfo(testSpec, groupIndex, groupsCount), totals, aborting()));
}

// Runs one test case to completion and returns the totals it contributed.
// The test body is executed repeatedly (one tracker cycle per execution)
// until the test case tracker reports successful completion or the run is
// aborting.
Totals RunContext::runTest(TestCase const &testCase) {
    Totals const totalsBefore = m_totals;

    std::string capturedCout;
    std::string capturedCerr;

    auto const &info = testCase.getTestCaseInfo();

    m_reporter->testCaseStarting(info);
    m_activeTestCase = &testCase;

    // The root tracker is a section tracker; seed it with the sections
    // selected in the configuration.
    ITracker &rootTracker = m_trackerContext.startRun();
    assert(rootTracker.isSectionTracker());
    static_cast<SectionTracker &>(rootTracker).addInitialFilters(m_config->getSectionsToRun());

    for (;;) {
        m_trackerContext.startCycle();
        m_testCaseTracker = &SectionTracker::acquire(
                m_trackerContext, TestCaseTracking::NameAndLocation(info.name, info.lineInfo));
        runCurrentTest(capturedCout, capturedCerr);

        if (m_testCaseTracker->isSuccessfullyCompleted() || aborting()) {
            break;
        }
    }

    Totals delta = m_totals.delta(totalsBefore);
    // A test that is expected to fail but passed is booked as a failure.
    if (info.expectedToFail() && delta.testCases.passed > 0) {
        delta.assertions.failed++;
        delta.testCases.passed--;
        delta.testCases.failed++;
    }
    m_totals.testCases += delta.testCases;

    TestCaseStats const caseStats(info, delta, capturedCout, capturedCerr, aborting());
    m_reporter->testCaseEnded(caseStats);

    m_activeTestCase = nullptr;
    m_testCaseTracker = nullptr;

    return delta;
}

// Returns the configuration this run context was created with.
IConfigPtr RunContext::config() const { return m_config; }

// Returns the reporter owned by this run context.
IStreamingReporter &RunContext::reporter() const { return *m_reporter; }

// Books a finished assertion: updates the assertion counters and the
// "last assertion passed" flag, notifies the reporter, clears unscoped
// messages (except after warnings) and remembers the result.
void RunContext::assertionEnded(AssertionResult const &result) {
    if (result.getResultType() == ResultWas::Ok) {
        // A plain pass is the only outcome counted as "passed".
        m_totals.assertions.passed++;
        m_lastAssertionPassed = true;
    } else if (result.isOk()) {
        // OK but not ResultWas::Ok: nothing is counted.
        m_lastAssertionPassed = true;
    } else {
        m_lastAssertionPassed = false;
        bool const toleratedFailure = m_activeTestCase->getTestCaseInfo().okToFail();
        if (toleratedFailure) {
            m_totals.assertions.failedButOk++;
        } else {
            m_totals.assertions.failed++;
        }
    }

    // The reporter's return value (whether messages should be cleared) is
    // deliberately ignored: messages are scoped and clear themselves.
    AssertionStats const stats(result, m_messages, m_totals);
    static_cast<void>(m_reporter->assertionEnded(stats));

    if (result.getResultType() != ResultWas::Warning) {
        m_messageScopes.clear();
    }

    // Reset working state
    resetAssertionInfo();
    m_lastResult = result;
}
// Clears the macro name of the last assertion info and replaces its captured
// expression with a placeholder text.
void RunContext::resetAssertionInfo() {
    m_lastAssertionInfo.capturedExpression = "{Unknown expression after the reported line}"_sr;
    m_lastAssertionInfo.macroName = StringRef();
}

// Called when a section is entered. Returns false if the section's tracker is
// not open (the section is skipped); otherwise records it as active, informs
// the reporter, stores the current assertion counts in `assertions` and
// returns true.
bool RunContext::sectionStarted(SectionInfo const &sectionInfo, Counts &assertions) {
    TestCaseTracking::NameAndLocation const sectionKey(sectionInfo.name, sectionInfo.lineInfo);
    ITracker &tracker = SectionTracker::acquire(m_trackerContext, sectionKey);

    if (tracker.isOpen()) {
        m_activeSections.push_back(&tracker);
        m_lastAssertionInfo.lineInfo = sectionInfo.lineInfo;
        m_reporter->sectionStarting(sectionInfo);
        assertions = m_totals.assertions;
        return true;
    }
    return false;
}
// Acquires the generator tracker identified by name and source location, and
// records that location as the line of the last assertion info.
auto RunContext::acquireGeneratorTracker(StringRef generatorName, SourceLineInfo const &lineInfo)
        -> IGeneratorTracker & {
    TestCaseTracking::NameAndLocation const generatorKey(static_cast<std::string>(generatorName),
                                                         lineInfo);
    Generators::GeneratorTracker &tracker =
            Generators::GeneratorTracker::acquire(m_trackerContext, generatorKey);
    m_lastAssertionInfo.lineInfo = lineInfo;
    return tracker;
}

// Checks whether a scope without any assertion has to be flagged. That is the
// case only when no assertion was counted, the config asks for the warning
// and the current tracker has no children. A flagged scope is booked as one
// failed assertion in both the running totals and `assertions`.
bool RunContext::testForMissingAssertions(Counts &assertions) {
    bool const nothingToFlag = assertions.total() != 0 ||
                               !m_config->warnAboutMissingAssertions() ||
                               m_trackerContext.currentTracker().hasChildren();
    if (nothingToFlag) {
        return false;
    }

    m_totals.assertions.failed++;
    assertions.failed++;
    return true;
}

// Finishes a section normally: computes the assertions that ran inside it,
// closes and removes the innermost active section (if any), reports the
// section statistics and clears all pending messages.
void RunContext::sectionEnded(SectionEndInfo const &endInfo) {
    Counts sectionAssertions = m_totals.assertions - endInfo.prevAssertions;
    bool const noAssertionsRan = testForMissingAssertions(sectionAssertions);

    bool const hasActiveSection = !m_activeSections.empty();
    if (hasActiveSection) {
        m_activeSections.back()->close();
        m_activeSections.pop_back();
    }

    SectionStats const stats(endInfo.sectionInfo, sectionAssertions, endInfo.durationInSeconds,
                             noAssertionsRan);
    m_reporter->sectionEnded(stats);

    m_messages.clear();
    m_messageScopes.clear();
}

// Handles a section that is left prematurely. The innermost active section is
// failed if no unfinished section has been recorded yet, otherwise it is just
// closed; its end info is queued for later processing.
void RunContext::sectionEndedEarly(SectionEndInfo const &endInfo) {
    auto *innermost = m_activeSections.back();
    bool const firstUnfinished = m_unfinishedSections.empty();
    if (firstUnfinished) {
        innermost->fail();
    } else {
        innermost->close();
    }
    m_activeSections.pop_back();

    m_unfinishedSections.push_back(endInfo);
}

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// Benchmark notifications: each of the following functions forwards its
// argument unchanged to the reporter's function of the same name.

// A benchmark with the given name is about to be prepared.
void RunContext::benchmarkPreparing(std::string const &name) {
    m_reporter->benchmarkPreparing(name);
}
// A benchmark is starting.
void RunContext::benchmarkStarting(BenchmarkInfo const &info) {
    m_reporter->benchmarkStarting(info);
}
// A benchmark finished and produced statistics.
void RunContext::benchmarkEnded(BenchmarkStats<> const &stats) {
    m_reporter->benchmarkEnded(stats);
}
// A benchmark failed with the given error text.
void RunContext::benchmarkFailed(std::string const &error) { m_reporter->benchmarkFailed(error); }
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// Appends a scoped message to the list of currently active messages.
void RunContext::pushScopedMessage(MessageInfo const &message) { m_messages.push_back(message); }

// Removes every active message that compares equal to `message`.
void RunContext::popScopedMessage(MessageInfo const &message) {
    auto const keptEnd = std::remove(m_messages.begin(), m_messages.end(), message);
    m_messages.erase(keptEnd, m_messages.end());
}

// Constructs a new entry in m_messageScopes from the given message builder.
void RunContext::emplaceUnscopedMessage(MessageBuilder const &builder) {
    m_messageScopes.emplace_back(builder);
}

// Name of the test case that is currently running, or an empty string when
// no test case is active.
std::string RunContext::getCurrentTestName() const {
    if (m_activeTestCase == nullptr) {
        return std::string();
    }
    return m_activeTestCase->getTestCaseInfo().name;
}

// Returns the address of the most recently stored assertion result.
// NOTE(review): m_lastResult is dereferenced unconditionally; what this yields
// before any assertion has ended depends on the type of m_lastResult, which is
// declared elsewhere -- confirm.
const AssertionResult *RunContext::getLastResult() const { return &(*m_lastResult); }

// Clears the flag that makes runCurrentTest() report an exception escaping
// the test body as unexpected.
void RunContext::exceptionEarlyReported() { m_shouldReportUnexpected = false; }

// Reports a fatal error condition and then closes everything that is still
// open -- pending sections, the test case section, the test case, the group
// and the run -- so that the reporter sees a complete sequence of events.
void RunContext::handleFatalErrorCondition(StringRef message) {
    // The reporter hears about the fatal error before anything else.
    m_reporter->fatalErrorEncountered(message);

    // The result is faked rather than rebuilt, because stringifying the
    // expression could itself trigger further fatal errors.
    AssertionResultData fatalData(ResultWas::FatalErrorCondition, {false});
    fatalData.message = static_cast<std::string>(message);
    AssertionResult fatalResult(m_lastAssertionInfo, fatalData);
    assertionEnded(fatalResult);

    handleUnfinishedSections();

    // The test case level section that was in scope is lost, so an
    // equivalent one is recreated here in order to report its end.
    auto const &activeInfo = m_activeTestCase->getTestCaseInfo();
    SectionInfo recreatedSection(activeInfo.lineInfo, activeInfo.name);

    Counts sectionAssertions;
    sectionAssertions.failed = 1;
    SectionStats recreatedStats(recreatedSection, sectionAssertions, 0, false);
    m_reporter->sectionEnded(recreatedStats);

    // The test case itself ends with exactly one failure.
    Totals fatalTotals;
    fatalTotals.testCases.failed = 1;
    fatalTotals.assertions.failed = 1;
    TestCaseStats const caseStats(activeInfo, fatalTotals, std::string(), std::string(), false);
    m_reporter->testCaseEnded(caseStats);

    m_totals.testCases.failed++;
    testGroupEnded(std::string(), m_totals, 1, 1);
    m_reporter->testRunEnded(TestRunStats(m_runInfo, m_totals, false));
}

// Whether the most recently processed assertion was recorded as passed.
bool RunContext::lastAssertionPassed() { return m_lastAssertionPassed; }

// Fast path for a passing assertion that is not reported: bumps the passed
// counter, marks the last assertion as passed, resets the assertion info and
// drops the unscoped messages.
void RunContext::assertionPassed() {
    m_totals.assertions.passed += 1;
    m_lastAssertionPassed = true;
    resetAssertionInfo();
    m_messageScopes.clear();
}

// True once the number of failed assertions has reached the configured
// abort-after limit (the limit is compared as an unsigned value).
bool RunContext::aborting() const {
    auto const failureLimit = static_cast<std::size_t>(m_config->abortAfter());
    return m_totals.assertions.failed >= failureLimit;
}

// Executes the active test case once, wrapped in a section that represents
// the test case itself. Output is captured into `redirectedCout` and
// `redirectedCerr` when the reporter asks for redirection. Exceptions leaving
// the test body are handled here; afterwards the test case tracker is closed,
// sections that ended early are finished and the section end is reported.
void RunContext::runCurrentTest(std::string &redirectedCout, std::string &redirectedCerr) {
    auto const &testCaseInfo = m_activeTestCase->getTestCaseInfo();
    SectionInfo testCaseSection(testCaseInfo.lineInfo, testCaseInfo.name);
    m_reporter->sectionStarting(testCaseSection);
    Counts prevAssertions = m_totals.assertions;
    // Stays 0 when the test body exits through an exception.
    double duration = 0;
    m_shouldReportUnexpected = true;
    m_lastAssertionInfo = {"TEST_CASE"_sr, testCaseInfo.lineInfo, StringRef(),
                           ResultDisposition::Normal};

    seedRng(*m_config);

    Timer timer;
    CATCH_TRY {
        if (m_reporter->getPreferences().shouldRedirectStdOut) {
            // Both variants keep a redirection object alive while the test
            // body runs; they differ only in the redirection type used.
#if !defined(CATCH_CONFIG_EXPERIMENTAL_REDIRECT)
            RedirectedStreams redirectedStreams(redirectedCout, redirectedCerr);

            timer.start();
            invokeActiveTestCase();
#else
            OutputRedirect r(redirectedCout, redirectedCerr);
            timer.start();
            invokeActiveTestCase();
#endif
        } else {
            timer.start();
            invokeActiveTestCase();
        }
        duration = timer.getElapsedSeconds();
    }
    CATCH_CATCH_ANON(TestFailureException &) {
        // This just means the test was aborted due to failure
    }
    CATCH_CATCH_ALL {
        // Under CATCH_CONFIG_FAST_COMPILE, unexpected exceptions under REQUIRE
        // assertions are reported without translation at the point of origin.
        if (m_shouldReportUnexpected) {
            AssertionReaction dummyReaction;
            handleUnexpectedInflightException(m_lastAssertionInfo, translateActiveException(),
                                              dummyReaction);
        }
    }
    // Assertions that ran during this execution of the test body.
    Counts assertions = m_totals.assertions - prevAssertions;
    bool missingAssertions = testForMissingAssertions(assertions);

    m_testCaseTracker->close();
    handleUnfinishedSections();
    m_messages.clear();
    m_messageScopes.clear();

    SectionStats testCaseSectionStats(testCaseSection, assertions, duration, missingAssertions);
    m_reporter->sectionEnded(testCaseSectionStats);
}

// Invokes the active test case while a guard object constructed from the
// fatal condition handler is alive.
void RunContext::invokeActiveTestCase() {
    FatalConditionHandlerGuard fatalGuard(&m_fatalConditionhandler);
    m_activeTestCase->invoke();
}

// Sections that ended prematurely because of an exception had their end infos
// stored so they can be torn down outside of stack unwinding. They are
// finished here, most recently stored first, and the store is then emptied.
void RunContext::handleUnfinishedSections() {
    auto pending = m_unfinishedSections.rbegin();
    auto const stop = m_unfinishedSections.rend();
    while (pending != stop) {
        sectionEnded(*pending);
        ++pending;
    }
    m_unfinishedSections.clear();
}

// Evaluates an assertion expression, taking negation from the result
// disposition into account. Failures are always reported and populate
// `reaction`; passes are reported only when successful results are included,
// otherwise they take the cheap assertionPassed() path.
void RunContext::handleExpr(AssertionInfo const &info,
                            ITransientExpression const &expr,
                            AssertionReaction &reaction) {
    m_reporter->assertionStarting(info);

    bool const negated = isFalseTest(info.resultDisposition);
    bool const passed = expr.getResult() != negated;

    if (!passed) {
        reportExpr(info, ResultWas::ExpressionFailed, &expr, negated);
        populateReaction(reaction);
        return;
    }

    if (m_includeSuccessfulResults) {
        reportExpr(info, ResultWas::Ok, &expr, negated);
    } else {
        assertionPassed();
    }
}
// Builds an assertion result of the given type for an expression, attaches
// the transient expression to it and hands it to assertionEnded().
void RunContext::reportExpr(AssertionInfo const &info,
                            ResultWas::OfType resultType,
                            ITransientExpression const *expr,
                            bool negated) {
    m_lastAssertionInfo = info;

    AssertionResultData resultData(resultType, LazyExpression(negated));
    AssertionResult outcome{info, resultData};
    outcome.m_resultData.lazyExpression.m_transientExpression = expr;

    assertionEnded(outcome);
}

// Handles a message-style assertion: records a result of the given type that
// carries `message`, and populates `reaction` when that result is not OK.
void RunContext::handleMessage(AssertionInfo const &info,
                               ResultWas::OfType resultType,
                               StringRef const &message,
                               AssertionReaction &reaction) {
    m_reporter->assertionStarting(info);
    m_lastAssertionInfo = info;

    AssertionResultData resultData(resultType, LazyExpression(false));
    resultData.message = static_cast<std::string>(message);

    AssertionResult outcome{m_lastAssertionInfo, resultData};
    assertionEnded(outcome);

    if (outcome.isOk()) {
        return;
    }
    populateReaction(reaction);
}
// Records a DidntThrowException result for the given assertion.
void RunContext::handleUnexpectedExceptionNotThrown(AssertionInfo const &info,
                                                    AssertionReaction &reaction) {
    ResultWas::OfType const resultType = ResultWas::DidntThrowException;
    handleNonExpr(info, resultType, reaction);
}

// Records a ThrewException result carrying the given (already translated)
// message and always populates `reaction`.
void RunContext::handleUnexpectedInflightException(AssertionInfo const &info,
                                                   std::string const &message,
                                                   AssertionReaction &reaction) {
    m_lastAssertionInfo = info;

    AssertionResultData resultData(ResultWas::ThrewException, LazyExpression(false));
    resultData.message = message;

    AssertionResult outcome{info, resultData};
    assertionEnded(outcome);

    populateReaction(reaction);
}

// Fills in how the assertion macro should react: break into the debugger if
// configured, and throw when the run is aborting or the last assertion's
// disposition has the Normal bit set.
void RunContext::populateReaction(AssertionReaction &reaction) {
    reaction.shouldDebugBreak = m_config->shouldDebugBreak();

    if (aborting()) {
        reaction.shouldThrow = true;
    } else {
        reaction.shouldThrow =
                (m_lastAssertionInfo.resultDisposition & ResultDisposition::Normal) != 0;
    }
}

// Records a ThrewException result whose message explains that exception
// translation was disabled.
void RunContext::handleIncomplete(AssertionInfo const &info) {
    m_lastAssertionInfo = info;

    AssertionResultData resultData(ResultWas::ThrewException, LazyExpression(false));
    resultData.message = "Exception translation was disabled by CATCH_CONFIG_FAST_COMPILE";

    AssertionResult outcome{info, resultData};
    assertionEnded(outcome);
}
// Records a result of the given type that has neither an expression nor a
// message, and populates `reaction` when that result is not OK.
void RunContext::handleNonExpr(AssertionInfo const &info,
                               ResultWas::OfType resultType,
                               AssertionReaction &reaction) {
    m_lastAssertionInfo = info;

    AssertionResultData resultData(resultType, LazyExpression(false));
    AssertionResult outcome{info, resultData};
    assertionEnded(outcome);

    if (outcome.isOk()) {
        return;
    }
    populateReaction(reaction);
}

// Returns the result capture installed in the current context; raises an
// internal error when none is installed.
IResultCapture &getResultCapture() {
    auto *capture = getCurrentContext().getResultCapture();
    if (capture) {
        return *capture;
    } else {
        CATCH_INTERNAL_ERROR("No result capture instance");
    }
}

// Seeds both std::rand and the framework's own generator from the configured
// seed. A seed of 0 leaves both generators untouched.
void seedRng(IConfig const &config) {
    if (config.rngSeed() == 0) {
        return;
    }
    std::srand(config.rngSeed());
    rng().seed(config.rngSeed());
}

// Returns the RNG seed of the config installed in the current context.
unsigned int rngSeed() { return getCurrentContext().getConfig()->rngSeed(); }

}  // namespace Catch
// end catch_run_context.cpp
// start catch_section.cpp

namespace Catch {

// Announces the section to the result capture, which decides whether the
// section is to be executed (m_sectionIncluded) and fills m_assertions, and
// then starts the section timer.
Section::Section(SectionInfo const &info)
        : m_info(info), m_sectionIncluded(getResultCapture().sectionStarted(m_info, m_assertions)) {
    m_timer.start();
}

// For an included section, reports the end of the section to the result
// capture: as "ended early" while an exception is in flight, otherwise as a
// regular end. Sections that were not included report nothing.
Section::~Section() {
    if (!m_sectionIncluded) {
        return;
    }

    SectionEndInfo endInfo{m_info, m_assertions, m_timer.getElapsedSeconds()};
    if (!uncaught_exceptions()) {
        getResultCapture().sectionEnded(endInfo);
    } else {
        getResultCapture().sectionEndedEarly(endInfo);
    }
}

// This indicates whether the section should be executed or not; the value is
// the one returned by sectionStarted() in the constructor.
Section::operator bool() const { return m_sectionIncluded; }

}  // end namespace Catch
// end catch_section.cpp
// start catch_section_info.cpp

namespace Catch {

// Stores the section's name and the source location it was declared at.
SectionInfo::SectionInfo(SourceLineInfo const &_lineInfo, std::string const &_name)
        : name(_name), lineInfo(_lineInfo) {}

}  // end namespace Catch
// end catch_section_info.cpp
// start catch_session.cpp

// start catch_session.h

#include <memory>

namespace Catch {

// Entry point object of a test executable: holds the command line parser and
// the configuration data it fills, and runs the tests.
class Session : NonCopyable {
public:
    Session();
    ~Session() override;

    // Print the usage text / the library identification block.
    void showHelp() const;
    void libIdentify();

    // Parses the command line into the configuration data. Returns 0 on
    // success and a non-zero value otherwise.
    int applyCommandLine(int argc, char const *const *argv);
#if defined(CATCH_CONFIG_WCHAR) && defined(_WIN32) && defined(UNICODE)
    // Wide-character variant, only available for Unicode Windows builds.
    int applyCommandLine(int argc, wchar_t const *const *argv);
#endif

    // Replaces the configuration data wholesale.
    void useConfigData(ConfigData const &configData);

    // Convenience overload: applies the command line and, if that succeeded,
    // runs the tests. Returns 1 immediately when startup exceptions were
    // recorded; otherwise returns the first non-zero code encountered.
    template <typename CharT>
    int run(int argc, CharT const *const argv[]) {
        if (m_startupExceptions)
            return 1;
        int returnCode = applyCommandLine(argc, argv);
        if (returnCode == 0)
            returnCode = run();
        return returnCode;
    }

    int run();

    // Access to the command line parser (getter and setter) and to the
    // configuration objects.
    clara::Parser const &cli() const;
    void cli(clara::Parser const &newParser);
    ConfigData &configData();
    Config &config();

private:
    int runInternal();

    clara::Parser m_cli;
    ConfigData m_configData;
    std::shared_ptr<Config> m_config;
    // Set by the constructor when exceptions were recorded during startup.
    bool m_startupExceptions = false;
};

}  // end namespace Catch

// end catch_session.h
// start catch_version.h

#include <iosfwd>

namespace Catch {

// Versioning information
// Immutable description of a library version. Instances cannot be copied or
// assigned, and every field is const.
struct Version {
    Version(Version const &) = delete;
    Version &operator=(Version const &) = delete;
    Version(unsigned int _majorVersion,
            unsigned int _minorVersion,
            unsigned int _patchNumber,
            char const *const _branchName,
            unsigned int _buildNumber);

    unsigned int const majorVersion;
    unsigned int const minorVersion;
    unsigned int const patchNumber;

    // buildNumber is only used if branchName is not null
    char const *const branchName;
    unsigned int const buildNumber;

    // Stream insertion for a version; defined elsewhere.
    friend std::ostream &operator<<(std::ostream &os, Version const &version);
};

Version const &libraryVersion();
}  // namespace Catch

// end catch_version.h
#include <cstdlib>
#include <iomanip>
#include <iterator>
#include <set>

namespace Catch {

namespace {
// Exit code returned by Session::applyCommandLine() when the command line
// cannot be parsed.
const int MaxExitCode = 255;

// Creates the reporter registered under `reporterName`; enforces that such a
// reporter exists.
IStreamingReporterPtr createReporter(std::string const &reporterName, IConfigPtr const &config) {
    auto const &reporters = Catch::getRegistryHub().getReporterRegistry();
    auto reporter = reporters.create(reporterName, config);
    CATCH_ENFORCE(reporter, "No reporter registered with name: '" << reporterName << "'");

    return reporter;
}

// Builds the reporter used for a run. Without registered listeners this is
// just the configured reporter; otherwise it is a ListeningReporter that
// holds one instance of every listener plus the configured reporter.
IStreamingReporterPtr makeReporter(std::shared_ptr<Config> const &config) {
    auto const &registeredListeners =
            Catch::getRegistryHub().getReporterRegistry().getListeners();
    if (registeredListeners.empty()) {
        return createReporter(config->getReporterName(), config);
    }

    // The pointer is created with the interface type right away and downcast
    // by hand: returning std::unique_ptr<ListeningReporter> does not compile
    // on older platforms without std::move, while adding std::move triggers a
    // warning on newer ones.
    auto ret = std::unique_ptr<IStreamingReporter>(new ListeningReporter);
    auto &combined = static_cast<ListeningReporter &>(*ret);

    for (auto const &listenerFactory : registeredListeners) {
        combined.addListener(listenerFactory->create(Catch::ReporterConfig(config)));
    }
    combined.addReporter(createReporter(config->getReporterName(), config));
    return ret;
}

// Selects the test cases to run for a configuration and executes them
// through a RunContext.
class TestGroup {
public:
    // Collects the tests to run. If the test spec matched nothing and had no
    // invalid arguments, every non-hidden test is selected; otherwise exactly
    // the tests of all filter matches are selected.
    explicit TestGroup(std::shared_ptr<Config> const &config)
            : m_config{config}, m_context{config, makeReporter(config)} {
        auto const &sortedTests = getAllTestCasesSorted(*m_config);
        m_matches = m_config->testSpec().matchesByFilter(sortedTests, *m_config);
        auto const &invalidArgs = m_config->testSpec().getInvalidArgs();

        bool const nothingSelected = m_matches.empty() && invalidArgs.empty();
        if (!nothingSelected) {
            for (auto const &match : m_matches) {
                m_tests.insert(match.tests.begin(), match.tests.end());
            }
            return;
        }

        for (auto const &test : sortedTests) {
            if (test.isHidden()) {
                continue;
            }
            m_tests.emplace(&test);
        }
    }

    // Runs the selected tests as a single group and returns the totals.
    // Once the run is aborting, the remaining tests are reported as skipped.
    // Filters without any matching test set the error field of the totals.
    Totals execute() {
        auto const &invalidArgs = m_config->testSpec().getInvalidArgs();
        Totals totals;
        m_context.testGroupStarting(m_config->name(), 1, 1);

        for (auto const &testCase : m_tests) {
            if (m_context.aborting()) {
                m_context.reporter().skipTest(*testCase);
                continue;
            }
            totals += m_context.runTest(*testCase);
        }

        for (auto const &match : m_matches) {
            if (!match.tests.empty()) {
                continue;
            }
            m_context.reporter().noMatchingTestCases(match.name);
            totals.error = -1;
        }

        for (auto const &invalidArg : invalidArgs) {
            m_context.reporter().reportInvalidArguments(invalidArg);
        }

        m_context.testGroupEnded(m_config->name(), totals, 1, 1);
        return totals;
    }

private:
    using Tests = std::set<TestCase const *>;

    std::shared_ptr<Config> m_config;
    RunContext m_context;
    Tests m_tests;
    TestSpec::Matches m_matches;
};

// Gives every registered test case an additional tag derived from the file it
// was declared in: the file name without directory and without extension,
// prefixed with '#'.
//
// The '#' prefix is applied unconditionally. Previously it was only written
// when the path contained a directory separator, so a test declared in a file
// referred to as plain "foo.cpp" received the tag "foo" instead of "#foo".
void applyFilenamesAsTags(Catch::IConfig const &config) {
    auto &tests = const_cast<std::vector<TestCase> &>(getAllTestCasesSorted(config));
    for (auto &testCase : tests) {
        auto tags = testCase.tags;

        std::string filename = testCase.lineInfo.file;

        // Strip the directory part, accepting both kinds of separators.
        auto const lastSlash = filename.find_last_of("\\/");
        if (lastSlash != std::string::npos) {
            filename.erase(0, lastSlash + 1);
        }

        // Strip the extension (everything from the last dot onwards).
        auto const lastDot = filename.find_last_of('.');
        if (lastDot != std::string::npos) {
            filename.erase(lastDot);
        }

        tags.push_back("#" + filename);
        setTags(testCase, tags);
    }
}

}  // namespace

// Constructs the session. Only one Session may ever be instantiated; a second
// instantiation is recorded as a startup exception. Any startup exceptions
// recorded so far are printed to the error stream and remembered in
// m_startupExceptions. Finally the command line parser is created.
Session::Session() {
    static bool alreadyInstantiated = false;
    if (alreadyInstantiated) {
        CATCH_TRY { CATCH_INTERNAL_ERROR("Only one instance of Catch::Session can ever be used"); }
        CATCH_CATCH_ALL { getMutableRegistryHub().registerStartupException(); }
    }

    // There cannot be exceptions at startup in no-exception mode.
#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
    const auto &exceptions = getRegistryHub().getStartupExceptionRegistry().getExceptions();
    if (!exceptions.empty()) {
        // A config has to be installed in the context before writing output.
        config();
        getCurrentMutableContext().setConfig(m_config);

        m_startupExceptions = true;
        Colour colourGuard(Colour::Red);
        Catch::cerr() << "Errors occurred during startup!" << '\n';
        // iterate over all exceptions and notify user
        for (const auto &ex_ptr : exceptions) {
            try {
                std::rethrow_exception(ex_ptr);
            } catch (std::exception const &ex) {
                Catch::cerr() << Column(ex.what()).indent(2) << '\n';
            } catch (...) {
                // A stored exception that does not derive from std::exception
                // must not escape the constructor; report it generically.
                Catch::cerr() << Column("Unknown exception").indent(2) << '\n';
            }
        }
    }
#endif

    alreadyInstantiated = true;
    m_cli = makeCommandLineParser(m_configData);
}
// Destroying the session runs the global clean-up.
Session::~Session() { Catch::cleanUp(); }

// Prints the library version, the command line usage and a pointer to the
// project documentation to the framework's output stream.
void Session::showHelp() const {
    auto &out = Catch::cout();
    out << "\nCatch v" << libraryVersion() << "\n" << m_cli << std::endl;
    out << "For more detailed usage please see the project docs\n" << std::endl;
}
// Prints the "libidentify" description block: four "key: value" rows whose
// keys are left-aligned and padded to 16 columns.
void Session::libIdentify() {
    std::ostream &out = Catch::cout();
    // Emits one padded key and hands the stream back so the value can follow.
    auto const key = [&out](char const *text) -> std::ostream & {
        return out << std::left << std::setw(16) << text;
    };

    key("description: ") << "A Catch2 test executable\n";
    key("category: ") << "testframework\n";
    key("framework: ") << "Catch Test\n";
    key("version: ") << libraryVersion() << std::endl;
}

// Parses the command line into m_configData.
//
// Returns 1 when startup exceptions were recorded, MaxExitCode when the
// arguments could not be parsed (after printing the error), and 0 otherwise.
// On success any cached Config is dropped so that it is rebuilt from the
// freshly parsed data.
int Session::applyCommandLine(int argc, char const *const *argv) {
    if (m_startupExceptions) {
        return 1;
    }

    auto parseOutcome = m_cli.parse(clara::Args(argc, argv));
    if (!parseOutcome) {
        // The config must be installed before the error is reported.
        config();
        getCurrentMutableContext().setConfig(m_config);
        Catch::cerr() << Colour(Colour::Red) << "\nError(s) in input:\n"
                      << Column(parseOutcome.errorMessage()).indent(2) << "\n\n";
        Catch::cerr() << "Run with -? for usage\n" << std::endl;
        return MaxExitCode;
    }

    if (m_configData.showHelp) {
        showHelp();
    }
    if (m_configData.libIdentify) {
        libIdentify();
    }
    m_config.reset();
    return 0;
}

#if defined(CATCH_CONFIG_WCHAR) && defined(_WIN32) && defined(UNICODE)
// Wide-character overload: converts every argument to UTF-8 with
// WideCharToMultiByte and forwards to the narrow-character overload.
// Returns whatever the narrow overload returns.
int Session::applyCommandLine(int argc, wchar_t const *const *argv) {
    char **utf8Argv = new char *[argc];

    for (int i = 0; i < argc; ++i) {
        // First call (null output buffer) only queries the required size.
        int bufSize = WideCharToMultiByte(CP_UTF8, 0, argv[i], -1, nullptr, 0, nullptr, nullptr);

        utf8Argv[i] = new char[bufSize];

        // Second call performs the actual conversion into the new buffer.
        WideCharToMultiByte(CP_UTF8, 0, argv[i], -1, utf8Argv[i], bufSize, nullptr, nullptr);
    }

    int returnCode = applyCommandLine(argc, utf8Argv);

    // Release the converted arguments, then the array that held them.
    for (int i = 0; i < argc; ++i)
        delete[] utf8Argv[i];

    delete[] utf8Argv;

    return returnCode;
}
#endif

// Replaces the session's configuration data and discards any cached Config,
// so the next config() call rebuilds it from the new data.
void Session::useConfigData(ConfigData const &configData) {
    m_configData = configData;
    m_config.reset();
}

// Runs the session and returns its exit code, optionally blocking on stdin
// before starting and/or before exiting as requested by
// m_configData.waitForKeypress.
int Session::run() {
    // Blocks until a character can be read from stdin; the value is ignored.
    auto const waitForEnter = [] { static_cast<void>(std::getchar()); };

    bool const pauseBeforeStart =
            (m_configData.waitForKeypress & WaitForKeypress::BeforeStart) != 0;
    if (pauseBeforeStart) {
        Catch::cout() << "...waiting for enter/ return before starting" << std::endl;
        waitForEnter();
    }

    int const exitCode = runInternal();

    bool const pauseBeforeExit =
            (m_configData.waitForKeypress & WaitForKeypress::BeforeExit) != 0;
    if (pauseBeforeExit) {
        Catch::cout() << "...waiting for enter/ return before exiting, with code: " << exitCode
                      << std::endl;
        waitForEnter();
    }
    return exitCode;
}

// Returns the command line parser currently used by the session.
clara::Parser const &Session::cli() const { return m_cli; }
// Replaces the command line parser used by the session.
void Session::cli(clara::Parser const &newParser) { m_cli = newParser; }
// Gives mutable access to the raw configuration data.
ConfigData &Session::configData() { return m_configData; }
// Returns the Config built from m_configData, creating it on first use.
// The cached instance is dropped by useConfigData() and by a successful
// applyCommandLine().
Config &Session::config() {
    if (!m_config)
        m_config = std::make_shared<Config>(m_configData);
    return *m_config;
}

// Executes the configured tests (or a listing request) and computes the
// process exit code.
//
// Returns 1 if startup exceptions were recorded, 0 if only help/libIdentify
// output was requested, the value produced by list() for a list request,
// 2 when warnAboutNoTests() is set and totals.error is -1, MaxExitCode if a
// std::exception escapes, and otherwise the larger of totals.error and the
// failed assertion count, clamped to MaxExitCode.
int Session::runInternal() {
    if (m_startupExceptions)
        return 1;

    if (m_configData.showHelp || m_configData.libIdentify) {
        return 0;
    }

    CATCH_TRY {
        config();  // Force config to be constructed

        seedRng(*m_config);

        if (m_configData.filenamesAsTags)
            applyFilenamesAsTags(*m_config);

        // Handle list request
        if (Option<std::size_t> listed = list(m_config))
            return static_cast<int>(*listed);

        TestGroup tests{m_config};
        auto const totals = tests.execute();

        // NOTE(review): -1 appears to be the "no tests ran" marker set by
        // TestGroup::execute(); confirm there.
        if (m_config->warnAboutNoTests() && totals.error == -1)
            return 2;

        // Note that on unices only the lower 8 bits are usually used, clamping
        // the return value to 255 prevents false negative when some multiple
        // of 256 tests has failed
        return (std::min)(MaxExitCode,
                          (std::max)(totals.error, static_cast<int>(totals.assertions.failed)));
    }
#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
    catch (std::exception &ex) {
        Catch::cerr() << ex.what() << std::endl;
        return MaxExitCode;
    }
#endif
}

}  // end namespace Catch
// end catch_session.cpp
// start catch_singletons.cpp

#include <vector>

namespace Catch {

namespace {
// Returns a reference to the pointer that holds the singleton list,
// allocating the list on first use (and again after cleanupSingletons() has
// reset the pointer to null). Returning the pointer by reference is what
// lets cleanupSingletons() null it out.
static auto getSingletons() -> std::vector<ISingleton *> *& {
    static std::vector<ISingleton *> *g_singletons = nullptr;
    if (!g_singletons)
        g_singletons = new std::vector<ISingleton *>();
    return g_singletons;
}
}  // namespace

// Out-of-line (empty) destructor for the singleton interface.
ISingleton::~ISingleton() {}

// Registers a singleton so that cleanupSingletons() deletes it later.
void addSingleton(ISingleton *singleton) { getSingletons()->push_back(singleton); }
void cleanupSingletons() {
    auto &singletons = getSingletons();
    for (auto singleton : *singletons)
        delete singleton;
    delete singletons;
    singletons = nullptr;
}

}  // namespace Catch
// end catch_singletons.cpp
// start catch_startup_exception_registry.cpp

#if !defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
namespace Catch {
// Records an exception captured during startup. The function is noexcept:
// if storing the exception itself throws, the process is terminated.
void StartupExceptionRegistry::add(std::exception_ptr const &exception) noexcept {
    CATCH_TRY { m_exceptions.push_back(exception); }
    CATCH_CATCH_ALL {
        // If we run out of memory during start-up there's really not a lot more we
        // can do about it
        std::terminate();
    }
}

// Returns the exceptions recorded so far, in the order they were added.
std::vector<std::exception_ptr> const &StartupExceptionRegistry::getExceptions() const noexcept {
    return m_exceptions;
}

}  // end namespace Catch
#endif
// end catch_startup_exception_registry.cpp
// start catch_stream.cpp

#include <cstdio>
#include <fstream>
#include <iostream>
#include <memory>
#include <sstream>
#include <vector>

namespace Catch {

// Out-of-line defaulted destructor for the stream interface.
Catch::IStream::~IStream() = default;

namespace Detail {
namespace {
// A std::streambuf that collects output in a fixed-size buffer and hands the
// buffered characters to a WriterF functor (as a std::string) whenever the
// buffer is flushed.
template <typename WriterF, std::size_t bufferSize = 256>
class StreamBufImpl : public std::streambuf {
    char data[bufferSize];
    WriterF m_writer;

public:
    // Makes the whole of `data` the put area.
    StreamBufImpl() { setp(data, data + sizeof(data)); }

    // Flushes any pending characters; the qualified call avoids virtual
    // dispatch from the destructor.
    ~StreamBufImpl() noexcept { StreamBufImpl::sync(); }

private:
    // Called when the put area is full: flush it, then store `c` (or write it
    // straight through if the put area has zero length). Always returns 0.
    int overflow(int c) override {
        sync();

        if (c != EOF) {
            if (pbase() == epptr())
                m_writer(std::string(1, static_cast<char>(c)));
            else
                sputc(static_cast<char>(c));
        }
        return 0;
    }

    // Passes the pending characters to the writer and rewinds the put
    // pointer to the start of the buffer. Always returns 0.
    int sync() override {
        if (pbase() != pptr()) {
            m_writer(std::string(pbase(), static_cast<std::string::size_type>(pptr() - pbase())));
            setp(pbase(), epptr());
        }
        return 0;
    }
};

///////////////////////////////////////////////////////////////////////////

// Writer functor for StreamBufImpl that forwards text to
// writeToDebugConsole().
struct OutputDebugWriter {
    void operator()(std::string const &str) { writeToDebugConsole(str); }
};

///////////////////////////////////////////////////////////////////////////

// IStream implementation that writes to a file.
class FileStream : public IStream {
    // mutable so that the const stream() accessor can return a writable stream
    mutable std::ofstream m_ofs;

public:
    // Opens `filename` for writing; CATCH_ENFORCE reports a failure to open.
    FileStream(StringRef filename) {
        m_ofs.open(filename.c_str());
        CATCH_ENFORCE(!m_ofs.fail(), "Unable to open file: '" << filename << "'");
    }
    ~FileStream() override = default;

public:  // IStream
    std::ostream &stream() const override { return m_ofs; }
};

///////////////////////////////////////////////////////////////////////////

// IStream implementation that writes through the stream buffer that
// Catch::cout() had when this object was constructed.
class CoutStream : public IStream {
    // mutable so that the const stream() accessor can return a writable stream
    mutable std::ostream m_os;

public:
    // Store the streambuf from cout up-front because
    // cout may get redirected when running tests
    CoutStream() : m_os(Catch::cout().rdbuf()) {}
    ~CoutStream() override = default;

public:  // IStream
    std::ostream &stream() const override { return m_os; }
};

///////////////////////////////////////////////////////////////////////////

// IStream implementation whose output is buffered by a StreamBufImpl and
// delivered through OutputDebugWriter.
class DebugOutStream : public IStream {
    // Declared before m_os: m_os is constructed from this buffer's pointer.
    std::unique_ptr<StreamBufImpl<OutputDebugWriter>> m_streamBuf;
    // mutable so that the const stream() accessor can return a writable stream
    mutable std::ostream m_os;

public:
    DebugOutStream()
            : m_streamBuf(new StreamBufImpl<OutputDebugWriter>()), m_os(m_streamBuf.get()) {}

    ~DebugOutStream() override = default;

public:  // IStream
    std::ostream &stream() const override { return m_os; }
};

}  // namespace
}  // namespace Detail

///////////////////////////////////////////////////////////////////////////

// Creates the output stream selected by `filename`; the caller receives a
// raw pointer to a newly allocated object.
//   - empty name       -> stream bound to Catch::cout()'s buffer
//   - "%debug"         -> debug-console stream
//   - any other "%..." -> reported through CATCH_ERROR
//   - anything else    -> file stream writing to that path
auto makeStream(StringRef const &filename) -> IStream const * {
    if (filename.empty()) {
        return new Detail::CoutStream();
    }
    if (filename[0] != '%') {
        return new Detail::FileStream(filename);
    }
    if (filename == "%debug") {
        return new Detail::DebugOutStream();
    }
    CATCH_ERROR("Unrecognised stream: '" << filename << "'");
}

// A pool of reusable std::ostringstream objects. Streams are addressed by
// their index in m_streams; released indices are remembered in m_unused and
// handed out again (most recently released first) before any new stream is
// allocated.
struct StringStreams {
    std::vector<std::unique_ptr<std::ostringstream>> m_streams;
    std::vector<std::size_t> m_unused;
    std::ostringstream m_referenceStream;  // Pristine stream whose format state is copied on release

    // Returns the index of a stream the caller may use.
    auto add() -> std::size_t {
        if (!m_unused.empty()) {
            std::size_t const recycled = m_unused.back();
            m_unused.pop_back();
            return recycled;
        }

        m_streams.push_back(std::unique_ptr<std::ostringstream>(new std::ostringstream));
        return m_streams.size() - 1;
    }

    // Returns the stream at `index` to the pool after restoring its
    // formatting flags and other state from the reference stream.
    void release(std::size_t index) {
        std::ostringstream &stream = *m_streams[index];
        stream.copyfmt(m_referenceStream);
        m_unused.push_back(index);
    }
};

// Borrows a stream from the StringStreams singleton pool, remembering both
// its pool index and a pointer to the stream.
ReusableStringStream::ReusableStringStream()
        : m_index(Singleton<StringStreams>::getMutable().add()),
          m_oss(Singleton<StringStreams>::getMutable().m_streams[m_index].get()) {}

// Empties the borrowed stream, clears its error state and returns it to the
// pool.
ReusableStringStream::~ReusableStringStream() {
    static_cast<std::ostringstream *>(m_oss)->str("");
    m_oss->clear();
    Singleton<StringStreams>::getMutable().release(m_index);
}

// Returns a copy of the text accumulated in the borrowed stream.
auto ReusableStringStream::str() const -> std::string {
    return static_cast<std::ostringstream *>(m_oss)->str();
}

///////////////////////////////////////////////////////////////////////////

// Default stream accessors. If you #define CATCH_CONFIG_NOSTDOUT you must
// implement these functions yourself.
#ifndef CATCH_CONFIG_NOSTDOUT
std::ostream &cout() { return std::cout; }
std::ostream &cerr() { return std::cerr; }
std::ostream &clog() { return std::clog; }
#endif
}  // namespace Catch
// end catch_stream.cpp
// start catch_string_manip.cpp

#include <algorithm>
#include <cctype>
#include <cstring>
#include <ostream>
#include <vector>

namespace Catch {

namespace {
// Lower-cases a single character. The value goes through unsigned char
// before it reaches std::tolower, so negative char values are not passed
// directly.
char toLowerCh(char c) {
    auto const asUnsigned = static_cast<unsigned char>(c);
    return static_cast<char>(std::tolower(asUnsigned));
}
}  // namespace

// Returns true when `s` begins with `prefix`; an empty prefix always matches.
bool startsWith(std::string const &s, std::string const &prefix) {
    if (prefix.size() > s.size()) {
        return false;
    }
    return s.compare(0, prefix.size(), prefix) == 0;
}
// Returns true when `s` is non-empty and its first character is `prefix`.
bool startsWith(std::string const &s, char prefix) {
    if (s.empty()) {
        return false;
    }
    return s.front() == prefix;
}
// Returns true when `s` finishes with `suffix`; an empty suffix always
// matches.
bool endsWith(std::string const &s, std::string const &suffix) {
    if (suffix.size() > s.size()) {
        return false;
    }
    return s.compare(s.size() - suffix.size(), suffix.size(), suffix) == 0;
}
// Returns true when `s` is non-empty and its last character is `suffix`.
bool endsWith(std::string const &s, char suffix) {
    if (s.empty()) {
        return false;
    }
    return s.back() == suffix;
}
// Returns true when `infix` occurs anywhere inside `s`.
bool contains(std::string const &s, std::string const &infix) {
    std::string::size_type const where = s.find(infix);
    return where != std::string::npos;
}
// Lower-cases every character of `s`, modifying the string itself.
void toLowerInPlace(std::string &s) {
    for (char &ch : s) {
        ch = toLowerCh(ch);
    }
}
// Returns a lower-cased copy of `s`; the argument is left untouched.
std::string toLower(std::string const &s) {
    std::string lowered(s);
    toLowerInPlace(lowered);
    return lowered;
}
// Returns a copy of `str` without leading and trailing whitespace (newline,
// carriage return, tab, space). A string consisting only of whitespace
// yields an empty string.
std::string trim(std::string const &str) {
    static char const *whitespaceChars = "\n\r\t ";

    std::string::size_type const first = str.find_first_not_of(whitespaceChars);
    if (first == std::string::npos) {
        return std::string();
    }

    std::string::size_type const last = str.find_last_not_of(whitespaceChars);
    return str.substr(first, last - first + 1);
}

// Returns the part of `ref` that remains after dropping leading and trailing
// spaces, tabs, newlines and carriage returns. The result is produced with
// StringRef::substr.
StringRef trim(StringRef ref) {
    auto const isBlank = [](char ch) -> bool {
        switch (ch) {
        case ' ':
        case '\t':
        case '\n':
        case '\r':
            return true;
        default:
            return false;
        }
    };

    // Advance past leading whitespace.
    size_t first = 0;
    for (; first < ref.size() && isBlank(ref[first]); ++first) {
    }

    // Walk back over trailing whitespace, never crossing `first`.
    size_t last = ref.size();
    for (; last > first && isBlank(ref[last - 1]); --last) {
    }

    return ref.substr(first, last - first);
}

// Replaces every occurrence of `replaceThis` in `str` with `withThis`,
// scanning left to right and never re-scanning text that was just inserted.
//
// Returns true if at least one replacement was made.
//
// An empty `replaceThis` is treated as "nothing to replace": the string is
// left untouched and false is returned. Without this guard an empty pattern
// matches at every position, so the loop would keep inserting `withThis`
// (or spin on the same index) and never terminate for a non-empty `str`.
bool replaceInPlace(std::string &str, std::string const &replaceThis, std::string const &withThis) {
    if (replaceThis.empty()) {
        return false;
    }

    bool replaced = false;
    std::size_t pos = str.find(replaceThis);
    while (pos != std::string::npos) {
        // Edit in place instead of rebuilding the whole string on every match.
        str.replace(pos, replaceThis.size(), withThis);
        replaced = true;
        // Resume after the inserted text so the replacement is never re-matched.
        pos = str.find(replaceThis, pos + withThis.size());
    }
    return replaced;
}

// Splits `str` at every `delimiter` and returns the non-empty pieces in
// order of appearance. Empty pieces (leading, trailing or consecutive
// delimiters) are skipped.
//
// The previous condition `pos - start > 1` also discarded one-character
// pieces that were followed by a delimiter (e.g. "a,b" yielded only "b"),
// which was inconsistent with the trailing piece, kept at any non-zero
// length. Every non-empty piece is now kept.
std::vector<StringRef> splitStringRef(StringRef str, char delimiter) {
    std::vector<StringRef> subStrings;
    std::size_t start = 0;
    for (std::size_t pos = 0; pos < str.size(); ++pos) {
        if (str[pos] != delimiter) {
            continue;
        }
        if (pos > start) {
            subStrings.push_back(str.substr(start, pos - start));
        }
        start = pos + 1;
    }
    // Whatever follows the last delimiter (or the whole input if there was none).
    if (start < str.size()) {
        subStrings.push_back(str.substr(start, str.size() - start));
    }
    return subStrings;
}

// Stores a count and the singular form of the label it applies to; the
// stream operator appends an 's' when the count is not 1.
pluralise::pluralise(std::size_t count, std::string const &label)
        : m_count(count), m_label(label) {}

// Writes "<count> <label>", followed by an 's' unless the count is exactly 1.
std::ostream &operator<<(std::ostream &os, pluralise const &pluraliser) {
    os << pluraliser.m_count << ' ' << pluraliser.m_label;
    bool const isSingular = (pluraliser.m_count == 1);
    if (!isSingular) {
        os << 's';
    }
    return os;
}

}  // namespace Catch
// end catch_string_manip.cpp
// start catch_stringref.cpp

#include <algorithm>
#include <cstdint>
#include <cstring>
#include <ostream>

namespace Catch {
// Builds a StringRef over a C string; the length is measured with
// std::strlen, so `rawChars` must be a valid null-terminated string.
StringRef::StringRef(char const *rawChars) noexcept
        : StringRef(rawChars, static_cast<StringRef::size_type>(std::strlen(rawChars))) {}

// Returns the referenced characters as a C string. CATCH_ENFORCE reports an
// error if isNullTerminated() is false for this instance.
auto StringRef::c_str() const -> char const * {
    CATCH_ENFORCE(isNullTerminated(),
                  "Called StringRef::c_str() on a non-null-terminated instance");
    return m_start;
}
// Returns a pointer to the first referenced character, with no check for
// null termination; use together with size().
auto StringRef::data() const noexcept -> char const * { return m_start; }

// Returns a view of at most `size` characters beginning at `start`. The
// length is clamped to what is available; a `start` at or beyond the end
// yields a default-constructed StringRef.
auto StringRef::substr(size_type start, size_type size) const noexcept -> StringRef {
    if (start >= m_size) {
        return StringRef();
    }
    size_type const available = m_size - start;
    return StringRef(m_start + start, (std::min)(available, size));
}
// Two StringRefs are equal when they have the same length and the same
// bytes.
auto StringRef::operator==(StringRef const &other) const noexcept -> bool {
    if (m_size != other.m_size) {
        return false;
    }
    return std::memcmp(m_start, other.m_start, m_size) == 0;
}

// Writes exactly str.size() characters to the stream; os.write is used so
// that no null terminator is required.
auto operator<<(std::ostream &os, StringRef const &str) -> std::ostream & {
    return os.write(str.data(), str.size());
}

// Appends the characters referenced by `rhs` to `lhs` and returns `lhs`.
auto operator+=(std::string &lhs, StringRef const &rhs) -> std::string & {
    lhs.append(rhs.data(), rhs.size());
    return lhs;
}

}  // namespace Catch
// end catch_stringref.cpp
// start catch_tag_alias.cpp

namespace Catch {
// Stores the tag expression an alias expands to together with the source
// location it was constructed with.
TagAlias::TagAlias(std::string const &_tag, SourceLineInfo _lineInfo)
        : tag(_tag), lineInfo(_lineInfo) {}
}  // namespace Catch
// end catch_tag_alias.cpp
// start catch_tag_alias_autoregistrar.cpp

namespace Catch {

// Registers `alias` -> `tag` with the mutable registry hub. Any exception
// raised by the registration is captured as a startup exception instead of
// propagating out of the constructor.
RegistrarForTagAliases::RegistrarForTagAliases(char const *alias,
                                               char const *tag,
                                               SourceLineInfo const &lineInfo) {
    CATCH_TRY { getMutableRegistryHub().registerTagAlias(alias, tag, lineInfo); }
    CATCH_CATCH_ALL {
        // Do not throw when constructing global objects, instead register the
        // exception to be processed later
        getMutableRegistryHub().registerStartupException();
    }
}

}  // namespace Catch
// end catch_tag_alias_autoregistrar.cpp
// start catch_tag_alias_registry.cpp

#include <sstream>

namespace Catch {

// Out-of-line (empty) destructor.
TagAliasRegistry::~TagAliasRegistry() {}

// Looks up `alias` and returns a pointer to its registered TagAlias, or
// nullptr when the alias is unknown.
TagAlias const *TagAliasRegistry::find(std::string const &alias) const {
    auto const entry = m_registry.find(alias);
    if (entry == m_registry.end()) {
        return nullptr;
    }
    return &(entry->second);
}

// Returns a copy of `unexpandedTestSpec` in which, for every registered
// alias, the first occurrence of the alias name is replaced by the tag
// expression it stands for. Aliases are applied in registry iteration order.
std::string TagAliasRegistry::expandAliases(std::string const &unexpandedTestSpec) const {
    std::string expanded = unexpandedTestSpec;
    for (auto const &entry : m_registry) {
        std::string const &aliasName = entry.first;
        std::size_t const at = expanded.find(aliasName);
        if (at == std::string::npos) {
            continue;
        }
        expanded.replace(at, aliasName.size(), entry.second.tag);
    }
    return expanded;
}

// Registers a new alias. Two conditions are enforced with CATCH_ENFORCE:
// the alias must start with "[@" and end with ']', and it must not have
// been registered before.
void TagAliasRegistry::add(std::string const &alias,
                           std::string const &tag,
                           SourceLineInfo const &lineInfo) {
    CATCH_ENFORCE(startsWith(alias, "[@") && endsWith(alias, ']'),
                  "error: tag alias, '" << alias << "' is not of the form [@alias name].\n"
                                        << lineInfo);

    // insert() reports through `.second` whether the key was newly added; on
    // a duplicate the message names the location of the existing entry.
    CATCH_ENFORCE(m_registry.insert(std::make_pair(alias, TagAlias(tag, lineInfo))).second,
                  "error: tag alias, '" << alias << "' already registered.\n"
                                        << "\tFirst seen at: " << find(alias)->lineInfo << "\n"
                                        << "\tRedefined at: " << lineInfo);
}

// Out-of-line (empty) destructor for the registry interface.
ITagAliasRegistry::~ITagAliasRegistry() {}

// Convenience accessor for the tag alias registry owned by the registry hub.
ITagAliasRegistry const &ITagAliasRegistry::get() { return getRegistryHub().getTagAliasRegistry(); }

}  // end namespace Catch
// end catch_tag_alias_registry.cpp
// start catch_test_case_info.cpp

#include <algorithm>
#include <cctype>
#include <exception>
#include <sstream>

namespace Catch {

namespace {
// Maps a tag (without its brackets) to the special property it stands for.
// Tags beginning with '.' and the tag "!hide" mark a test as hidden;
// "!benchmark" yields Benchmark combined with IsHidden. Any tag that is not
// recognised yields TestCaseInfo::None.
TestCaseInfo::SpecialProperties parseSpecialTag(std::string const &tag) {
    if (startsWith(tag, '.') || tag == "!hide") {
        return TestCaseInfo::IsHidden;
    }
    if (tag == "!throws") {
        return TestCaseInfo::Throws;
    }
    if (tag == "!shouldfail") {
        return TestCaseInfo::ShouldFail;
    }
    if (tag == "!mayfail") {
        return TestCaseInfo::MayFail;
    }
    if (tag == "!nonportable") {
        return TestCaseInfo::NonPortable;
    }
    if (tag == "!benchmark") {
        return static_cast<TestCaseInfo::SpecialProperties>(TestCaseInfo::Benchmark |
                                                            TestCaseInfo::IsHidden);
    }
    return TestCaseInfo::None;
}
// A tag is reserved when it is non-empty, is not one of the recognised
// special tags, and its first character is not alphanumeric.
bool isReservedTag(std::string const &tag) {
    if (tag.empty()) {
        return false;
    }
    if (parseSpecialTag(tag) != TestCaseInfo::None) {
        return false;
    }
    return !std::isalnum(static_cast<unsigned char>(tag[0]));
}
// Reports an error through CATCH_ENFORCE when `tag` is a reserved tag name;
// the message includes the tag and the source location given in `_lineInfo`.
void enforceNotReservedTag(std::string const &tag, SourceLineInfo const &_lineInfo) {
    CATCH_ENFORCE(!isReservedTag(tag), "Tag name: [" << tag << "] is not allowed.\n"
                                                     << "Tag names starting with non alphanumeric "
                                                        "characters are reserved\n"
                                                     << _lineInfo);
}
}  // namespace

// Builds a TestCase from an invoker, a class name, a name/tags pair and a
// source location.
//
// The tags string is scanned character by character: text inside `[...]`
// becomes a tag, text outside brackets is collected into the description.
// Tags that are not special are checked against the reserved-name rule.
// If any tag marks the test as hidden, both "." and "!hide" are added.
TestCase makeTestCase(ITestInvoker *_testCase,
                      std::string const &_className,
                      NameAndTags const &nameAndTags,
                      SourceLineInfo const &_lineInfo) {
    bool isHidden = false;

    // Parse out tags
    std::vector<std::string> tags;
    std::string desc, tag;
    bool inTag = false;
    for (char c : nameAndTags.tags) {
        if (!inTag) {
            if (c == '[')
                inTag = true;
            else
                desc += c;
        } else {
            if (c == ']') {
                // End of a tag: classify it before storing it.
                TestCaseInfo::SpecialProperties prop = parseSpecialTag(tag);
                if ((prop & TestCaseInfo::IsHidden) != 0)
                    isHidden = true;
                else if (prop == TestCaseInfo::None)
                    enforceNotReservedTag(tag, _lineInfo);

                // Merged hide tags like `[.approvals]` should be added as
                // `[.][approvals]`. The `[.]` is added at later point, so
                // we only strip the prefix
                if (startsWith(tag, '.') && tag.size() > 1) {
                    tag.erase(0, 1);
                }
                tags.push_back(tag);
                tag.clear();
                inTag = false;
            } else
                tag += c;
        }
    }
    if (isHidden) {
        // Add all "hidden" tags to make them behave identically
        tags.insert(tags.end(), {".", "!hide"});
    }

    TestCaseInfo info(static_cast<std::string>(nameAndTags.name), _className, desc, tags,
                      _lineInfo);
    return TestCase(_testCase, std::move(info));
}

// Replaces the tags of `testCaseInfo` with the sorted, de-duplicated
// contents of `tags`, rebuilds the lower-cased tag list, and ORs the special
// properties implied by each tag into the existing `properties` (properties
// that are already set are not cleared).
void setTags(TestCaseInfo &testCaseInfo, std::vector<std::string> tags) {
    // std::unique only removes adjacent duplicates, hence the sort first.
    std::sort(begin(tags), end(tags));
    tags.erase(std::unique(begin(tags), end(tags)), end(tags));
    testCaseInfo.lcaseTags.clear();

    for (auto const &tag : tags) {
        std::string lcaseTag = toLower(tag);
        testCaseInfo.properties = static_cast<TestCaseInfo::SpecialProperties>(
                testCaseInfo.properties | parseSpecialTag(lcaseTag));
        testCaseInfo.lcaseTags.push_back(lcaseTag);
    }
    testCaseInfo.tags = std::move(tags);
}

// Initialises the descriptive fields, starts with no special properties and
// then lets setTags() normalise the tags and derive the properties.
TestCaseInfo::TestCaseInfo(std::string const &_name,
                           std::string const &_className,
                           std::string const &_description,
                           std::vector<std::string> const &_tags,
                           SourceLineInfo const &_lineInfo)
        : name(_name),
          className(_className),
          description(_description),
          lineInfo(_lineInfo),
          properties(None) {
    setTags(*this, _tags);
}

// Property queries: each one tests bits of the `properties` mask.
// True when the IsHidden bit is set.
bool TestCaseInfo::isHidden() const { return (properties & IsHidden) != 0; }
// True when the Throws bit is set.
bool TestCaseInfo::throws() const { return (properties & Throws) != 0; }
// True when either ShouldFail or MayFail is set.
bool TestCaseInfo::okToFail() const { return (properties & (ShouldFail | MayFail)) != 0; }
// True only when ShouldFail is set.
bool TestCaseInfo::expectedToFail() const { return (properties & (ShouldFail)) != 0; }

std::string TestCaseInfo::tagsAsString() const {
    std::string ret;
    // '[' and ']' per tag
    std::size_t full_size = 2 * tags.size();
    for (const auto &tag : tags) {
        full_size += tag.size();
    }
    ret.reserve(full_size);
    for (const auto &tag : tags) {
        ret.push_back('[');
        ret.append(tag);
        ret.push_back(']');
    }

    return ret;
}

// Combines test metadata (moved into the TestCaseInfo base) with the invoker
// that runs the test body.
TestCase::TestCase(ITestInvoker *testCase, TestCaseInfo &&info)
        : TestCaseInfo(std::move(info)), test(testCase) {}

// Returns a copy of this test case whose name is `_newName`; this object is
// not modified.
TestCase TestCase::withName(std::string const &_newName) const {
    TestCase other(*this);
    other.name = _newName;
    return other;
}

// Runs the test body through the stored invoker.
void TestCase::invoke() const { test->invoke(); }

// Test cases are equal when they share the same invoker object, name and
// class name.
bool TestCase::operator==(TestCase const &other) const {
    return test.get() == other.test.get() && name == other.name && className == other.className;
}

// Orders test cases by name only.
bool TestCase::operator<(TestCase const &other) const { return name < other.name; }

// Exposes the TestCaseInfo base sub-object.
TestCaseInfo const &TestCase::getTestCaseInfo() const { return *this; }

}  // end namespace Catch
// end catch_test_case_info.cpp
// start catch_test_case_registry_impl.cpp

#include <algorithm>
#include <sstream>

namespace Catch {

namespace {
// Hashes a test case's name together with a caller-supplied suffix into a
// 32-bit value. sortTests() passes the RNG seed as the suffix.
struct TestHasher {
    using hash_t = uint64_t;

    explicit TestHasher(hash_t hashSuffix) : m_hashSuffix{hashSuffix} {}

    uint32_t operator()(TestCase const &t) const {
        // FNV-1a hash with multiplication fold.
        const hash_t prime = 1099511628211u;
        hash_t hash = 14695981039346656037u;
        for (const char c : t.name) {
            // NOTE(review): `c` is a plain char, so on platforms where char is
            // signed a negative value is sign-extended before the XOR.
            hash ^= c;
            hash *= prime;
        }
        // Mix in the suffix as one more round.
        hash ^= m_hashSuffix;
        hash *= prime;
        // Fold the 64-bit state to 32 bits by multiplying its two halves.
        const uint32_t low{static_cast<uint32_t>(hash)};
        const uint32_t high{static_cast<uint32_t>(hash >> 32)};
        return low * high;
    }

private:
    hash_t m_hashSuffix;
};
}  // end unnamed namespace

// Returns a copy of `unsortedTestCases` arranged according to
// config.runOrder():
//   - InDeclarationOrder:     unchanged order
//   - InLexicographicalOrder: sorted with TestCase::operator< (by name)
//   - InRandomOrder:          sorted by a hash of each test name combined
//                             with config.rngSeed(), ties broken by name
std::vector<TestCase> sortTests(IConfig const &config,
                                std::vector<TestCase> const &unsortedTestCases) {
    switch (config.runOrder()) {
    case RunTests::InDeclarationOrder:
        // already in declaration order
        break;

    case RunTests::InLexicographicalOrder: {
        std::vector<TestCase> sorted = unsortedTestCases;
        std::sort(sorted.begin(), sorted.end());
        return sorted;
    }

    case RunTests::InRandomOrder: {
        seedRng(config);
        TestHasher h{config.rngSeed()};

        // Pair each test with its hash; pointers avoid copying the test
        // cases while sorting.
        using hashedTest = std::pair<TestHasher::hash_t, TestCase const *>;
        std::vector<hashedTest> indexed_tests;
        indexed_tests.reserve(unsortedTestCases.size());

        for (auto const &testCase : unsortedTestCases) {
            indexed_tests.emplace_back(h(testCase), &testCase);
        }

        std::sort(indexed_tests.begin(), indexed_tests.end(),
                  [](hashedTest const &lhs, hashedTest const &rhs) {
                      // Equal hashes fall back to name order.
                      if (lhs.first == rhs.first) {
                          return lhs.second->name < rhs.second->name;
                      }
                      return lhs.first < rhs.first;
                  });

        std::vector<TestCase> sorted;
        sorted.reserve(indexed_tests.size());

        for (auto const &hashed : indexed_tests) {
            sorted.emplace_back(*hashed.second);
        }

        return sorted;
    }
    }
    // Reached for declaration order (and for any value the switch does not
    // handle).
    return unsortedTestCases;
}

// A test is "throw safe" when it is not marked as throwing, or when the
// configuration allows throwing tests.
bool isThrowSafe(TestCase const &testCase, IConfig const &config) {
    return !testCase.throws() || config.allowThrows();
}

// True when the test matches `testSpec` and is throw safe under `config`.
bool matchTest(TestCase const &testCase, TestSpec const &testSpec, IConfig const &config) {
    return testSpec.matches(testCase) && isThrowSafe(testCase, config);
}

// Reports an error through CATCH_ENFORCE for the first test case that
// compares equivalent to an earlier one in a std::set<TestCase> (ordered by
// TestCase::operator<). The message names both source locations.
void enforceNoDuplicateTestCases(std::vector<TestCase> const &functions) {
    std::set<TestCase> seenFunctions;
    for (auto const &function : functions) {
        // insert() returns {iterator to the stored element, whether inserted}.
        auto prev = seenFunctions.insert(function);
        CATCH_ENFORCE(prev.second, "error: TEST_CASE( \""
                                           << function.name << "\" ) already defined.\n"
                                           << "\tFirst seen at "
                                           << prev.first->getTestCaseInfo().lineInfo << "\n"
                                           << "\tRedefined at "
                                           << function.getTestCaseInfo().lineInfo);
    }
}

std::vector<TestCase> filterTests(std::vector<TestCase> const &testCases,
                                  TestSpec const &testSpec,
                                  IConfig const &config) {
    std::vector<TestCase> filtered;
    filtered.reserve(testCases.size());
    for (auto const &testCase : testCases) {
        if ((!testSpec.hasFilters() && !testCase.isHidden()) ||
            (testSpec.hasFilters() && matchTest(testCase, testSpec, config))) {
            filtered.push_back(testCase);
        }
    }
    return filtered;
}
// Convenience wrapper: fetches the sorted test list from the test case
// registry owned by the registry hub.
std::vector<TestCase> const &getAllTestCasesSorted(IConfig const &config) {
    return getRegistryHub().getTestCaseRegistry().getAllTestsSorted(config);
}

// Adds a test case to the registry. A test with an empty name is registered
// under the generated name "Anonymous test case N", where N is a running
// counter.
void TestRegistry::registerTest(TestCase const &testCase) {
    std::string name = testCase.getTestCaseInfo().name;
    if (name.empty()) {
        ReusableStringStream rss;
        rss << "Anonymous test case " << ++m_unnamedCount;
        // Re-enter with the renamed copy; its name is no longer empty.
        return registerTest(testCase.withName(rss.str()));
    }
    m_functions.push_back(testCase);
}

// Returns the registered test cases in registration order.
std::vector<TestCase> const &TestRegistry::getAllTests() const { return m_functions; }
// Returns the test cases in the order requested by config.runOrder().
// The sorted list is cached and rebuilt only when the requested order
// changes or the cache is empty; duplicates are checked whenever the cache
// is empty.
std::vector<TestCase> const &TestRegistry::getAllTestsSorted(IConfig const &config) const {
    if (m_sortedFunctions.empty())
        enforceNoDuplicateTestCases(m_functions);

    if (m_currentSortOrder != config.runOrder() || m_sortedFunctions.empty()) {
        m_sortedFunctions = sortTests(config, m_functions);
        m_currentSortOrder = config.runOrder();
    }
    return m_sortedFunctions;
}

///////////////////////////////////////////////////////////////////////////
// Invoker that wraps a plain `void()` function pointer.
TestInvokerAsFunction::TestInvokerAsFunction(void (*testAsFunction)()) noexcept
        : m_testAsFunction(testAsFunction) {}

// Calls the wrapped function.
void TestInvokerAsFunction::invoke() const { m_testAsFunction(); }

// Derives a class name from either a plain class name or a string starting
// with '&' (e.g. "&ns::Class::method").
//
// Input that does not start with '&' is returned unchanged. Otherwise the
// result is the text between the second-to-last and the last "::"; if there
// is only one "::", the text between the leading '&' and that "::".
std::string extractClassName(StringRef const &classOrQualifiedMethodName) {
    std::string className(classOrQualifiedMethodName);
    if (startsWith(className, '&')) {
        std::size_t lastColons = className.rfind("::");
        // NOTE(review): if no "::" exists, lastColons is npos and the
        // arithmetic below relies on unsigned wrap-around and on substr
        // clamping its length argument.
        std::size_t penultimateColons = className.rfind("::", lastColons - 1);
        if (penultimateColons == std::string::npos)
            penultimateColons = 1;  // just past the leading '&'
        className = className.substr(penultimateColons, lastColons - penultimateColons);
    }
    return className;
}

}  // end namespace Catch
// end catch_test_case_registry_impl.cpp
// start catch_test_case_tracker.cpp

#include <algorithm>
#include <cassert>
#include <memory>
#include <sstream>
#include <stdexcept>

#if defined(__clang__)
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wexit-time-destructors"
#endif

namespace Catch {
namespace TestCaseTracking {

// Identifies a tracker by its name together with a source location.
NameAndLocation::NameAndLocation(std::string const &_name, SourceLineInfo const &_location)
        : name(_name), location(_location) {}

// Out-of-line defaulted destructor for the tracker interface.
ITracker::~ITracker() = default;

// Begins a new run: creates a fresh root SectionTracker named "{root}" with
// no parent, clears the current tracker and marks the context as executing.
// Returns the new root tracker.
ITracker &TrackerContext::startRun() {
    m_rootTracker = std::make_shared<SectionTracker>(
            NameAndLocation("{root}", CATCH_INTERNAL_LINEINFO), *this, nullptr);
    m_currentTracker = nullptr;
    m_runState = Executing;
    return *m_rootTracker;
}

// Ends the run: releases the root tracker, clears the current tracker and
// returns the context to the NotStarted state.
void TrackerContext::endRun() {
    m_rootTracker.reset();
    m_currentTracker = nullptr;
    m_runState = NotStarted;
}

// Starts a cycle: the root tracker becomes the current tracker and the
// context is marked as executing.
void TrackerContext::startCycle() {
    m_currentTracker = m_rootTracker.get();
    m_runState = Executing;
}
// Marks the current cycle as completed.
void TrackerContext::completeCycle() { m_runState = CompletedCycle; }

// True once completeCycle() has been called for the current cycle.
bool TrackerContext::completedCycle() const { return m_runState == CompletedCycle; }
// Returns the current tracker; the pointer is dereferenced without a null
// check.
ITracker &TrackerContext::currentTracker() { return *m_currentTracker; }
// Makes `tracker` the current tracker.
void TrackerContext::setCurrentTracker(ITracker *tracker) { m_currentTracker = tracker; }

// Stores the tracker's identity, the owning context and the parent tracker
// (the root tracker is created with a null parent).
TrackerBase::TrackerBase(NameAndLocation const &nameAndLocation,
                         TrackerContext &ctx,
                         ITracker *parent)
        : ITracker(nameAndLocation), m_ctx(ctx), m_parent(parent) {}

// A tracker is complete once it has finished, successfully or by failing.
bool TrackerBase::isComplete() const {
    return m_runState == CompletedSuccessfully || m_runState == Failed;
}
// True only for a successful completion.
bool TrackerBase::isSuccessfullyCompleted() const { return m_runState == CompletedSuccessfully; }
// True when the tracker has been started and is not yet complete.
bool TrackerBase::isOpen() const { return m_runState != NotStarted && !isComplete(); }
// True when at least one child tracker has been added.
bool TrackerBase::hasChildren() const { return !m_children.empty(); }

// Appends `child` to this tracker's list of children.
void TrackerBase::addChild(ITrackerPtr const &child) { m_children.push_back(child); }

// Returns the first child whose location and name both equal those in
// `nameAndLocation`, or a null pointer if there is no such child.
ITrackerPtr TrackerBase::findChild(NameAndLocation const &nameAndLocation) {
    auto it = std::find_if(
            m_children.begin(), m_children.end(), [&nameAndLocation](ITrackerPtr const &tracker) {
                return tracker->nameAndLocation().location == nameAndLocation.location &&
                       tracker->nameAndLocation().name == nameAndLocation.name;
            });
    return (it != m_children.end()) ? *it : nullptr;
}
// Returns the parent tracker. Must not be called on the root tracker, whose
// parent pointer is null (checked by the assert in debug builds).
ITracker &TrackerBase::parent() {
    assert(m_parent);  // Should always be non-null except for root
    return *m_parent;
}

// Records that a child of this tracker is being executed and forwards the
// notification to the parent, if any. Does nothing when this tracker is
// already in the ExecutingChildren state.
void TrackerBase::openChild() {
    if (m_runState == ExecutingChildren) {
        return;
    }

    m_runState = ExecutingChildren;
    if (m_parent) {
        m_parent->openChild();
    }
}

// Kind queries; the base implementations answer false, and
// SectionTracker overrides isSectionTracker() to return true.
bool TrackerBase::isSectionTracker() const { return false; }
bool TrackerBase::isGeneratorTracker() const { return false; }

// Opens this tracker: marks it as executing, makes it the context's current
// tracker and tells the parent (if any) that a child has been opened.
void TrackerBase::open() {
    m_runState = Executing;
    moveToThis();
    if (m_parent)
        m_parent->openChild();
}

// Closes this tracker at the end of a pass, updates its run state, moves the
// context back to the parent and completes the current cycle.
void TrackerBase::close() {
    // Close any still open children (e.g. generators)
    while (&m_ctx.currentTracker() != this)
        m_ctx.currentTracker().close();

    switch (m_runState) {
    case NeedsAnotherRun:
        // Left unchanged.
        break;

    case Executing:
        m_runState = CompletedSuccessfully;
        break;
    case ExecutingChildren:
        // Only complete once every child is complete; otherwise the state
        // stays as ExecutingChildren.
        if (std::all_of(m_children.begin(), m_children.end(),
                        [](ITrackerPtr const &t) { return t->isComplete(); }))
            m_runState = CompletedSuccessfully;
        break;

    case NotStarted:
    case CompletedSuccessfully:
    case Failed:
        // Closing a tracker in any of these states is reported as an
        // internal error.
        CATCH_INTERNAL_ERROR("Illogical state: " << m_runState);

    default:
        CATCH_INTERNAL_ERROR("Unknown state: " << m_runState);
    }
    moveToParent();
    m_ctx.completeCycle();
}
// Marks this tracker as Failed, flags the parent (if any) as needing another
// run, moves the context's current tracker to the parent and calls
// completeCycle() on the context.
void TrackerBase::fail() {
    m_runState = Failed;
    if (m_parent)
        m_parent->markAsNeedingAnotherRun();
    moveToParent();
    m_ctx.completeCycle();
}
// Sets the run state to NeedsAnotherRun.
void TrackerBase::markAsNeedingAnotherRun() { m_runState = NeedsAnotherRun; }

// Makes the parent the context's current tracker. A parent is required
// (asserted in debug builds).
void TrackerBase::moveToParent() {
    assert(m_parent);
    m_ctx.setCurrentTracker(m_parent);
}
// Makes this tracker the context's current tracker.
void TrackerBase::moveToThis() { m_ctx.setCurrentTracker(this); }

// Constructs a section tracker and caches the trimmed section name. When a
// parent is given, the nearest ancestor that is a section tracker (possibly
// the parent itself) passes on its filters via addNextFilters().
SectionTracker::SectionTracker(NameAndLocation const &nameAndLocation,
                               TrackerContext &ctx,
                               ITracker *parent)
        : TrackerBase(nameAndLocation, ctx, parent), m_trimmed_name(trim(nameAndLocation.name)) {
    if (!parent)
        return;

    // Walk up the tracker chain until a section tracker is found.
    ITracker *enclosing = parent;
    while (!enclosing->isSectionTracker())
        enclosing = &enclosing->parent();

    addNextFilters(static_cast<SectionTracker &>(*enclosing).m_filters);
}

// A section is reported as complete unless it is selected by the filters.
// It is selected when there are no filters, when the first filter is empty,
// or when its trimmed name appears among the filters; only then is the
// base-class completion state consulted.
bool SectionTracker::isComplete() const {
    bool const selected =
            m_filters.empty() || m_filters[0] == "" ||
            std::find(m_filters.begin(), m_filters.end(), m_trimmed_name) != m_filters.end();

    return selected ? TrackerBase::isComplete() : true;
}

// Identifies this tracker as a section tracker (always true).
bool SectionTracker::isSectionTracker() const { return true; }

// Looks up the section tracker identified by `nameAndLocation` among the
// children of the context's current tracker, creating and registering a new
// one when none exists. Unless the context reports a completed cycle, the
// section is then given the chance to open. Returns the section.
SectionTracker &SectionTracker::acquire(TrackerContext &ctx,
                                        NameAndLocation const &nameAndLocation) {
    ITracker &current = ctx.currentTracker();
    ITrackerPtr existing = current.findChild(nameAndLocation);

    std::shared_ptr<SectionTracker> section;
    if (!existing) {
        section = std::make_shared<SectionTracker>(nameAndLocation, ctx, &current);
        current.addChild(section);
    } else {
        assert(existing->isSectionTracker());
        section = std::static_pointer_cast<SectionTracker>(existing);
    }

    if (!ctx.completedCycle())
        section->tryOpen();
    return *section;
}

// Opens the section unless isComplete() already reports it as complete.
void SectionTracker::tryOpen() {
    if (!isComplete())
        open();
}

// Installs the section filters. Two empty placeholder entries are added
// ahead of the supplied filters. An empty `filters` list leaves the tracker
// untouched.
void SectionTracker::addInitialFilters(std::vector<std::string> const &filters) {
    if (filters.empty())
        return;

    m_filters.reserve(m_filters.size() + filters.size() + 2);
    m_filters.emplace_back("");  // Root - should never be consulted
    m_filters.emplace_back("");  // Test Case - not a section filter
    m_filters.insert(m_filters.end(), filters.begin(), filters.end());
}
// Appends every filter except the first one from `filters`. Lists with fewer
// than two entries contribute nothing.
void SectionTracker::addNextFilters(std::vector<std::string> const &filters) {
    if (filters.size() <= 1)
        return;

    auto const firstInherited = filters.begin() + 1;
    m_filters.insert(m_filters.end(), firstInherited, filters.end());
}

// Read-only access to the filters held by this section tracker.
std::vector<std::string> const &SectionTracker::getFilters() const { return m_filters; }

// The section name with surrounding whitespace trimmed, as computed in the
// constructor.
std::string const &SectionTracker::trimmedName() const { return m_trimmed_name; }

}  // namespace TestCaseTracking

using TestCaseTracking::ITracker;
using TestCaseTracking::SectionTracker;
using TestCaseTracking::TrackerContext;

}  // namespace Catch

#if defined(__clang__)
#pragma clang diagnostic pop
#endif
// end catch_test_case_tracker.cpp
// start catch_test_registry.cpp

namespace Catch {

// Wraps a free test function in a heap-allocated TestInvokerAsFunction.
// Uses the non-throwing form of new, so the result is nullptr if allocation
// fails.
auto makeTestInvoker(void (*testAsFunction)()) noexcept -> ITestInvoker * {
    return new (std::nothrow) TestInvokerAsFunction(testAsFunction);
}

// Stores the test name and the tag string as given.
NameAndTags::NameAndTags(StringRef const &name_, StringRef const &tags_) noexcept
        : name(name_), tags(tags_) {}

// Registers a test case with the mutable registry hub. The test case is built
// from the invoker, the class name extracted from `classOrMethod`, the
// name/tags pair and the source location. The constructor is noexcept: any
// exception raised during registration is handed to
// registerStartupException() instead of propagating.
AutoReg::AutoReg(ITestInvoker *invoker,
                 SourceLineInfo const &lineInfo,
                 StringRef const &classOrMethod,
                 NameAndTags const &nameAndTags) noexcept {
    CATCH_TRY {
        getMutableRegistryHub().registerTest(
                makeTestCase(invoker, extractClassName(classOrMethod), nameAndTags, lineInfo));
    }
    CATCH_CATCH_ALL {
        // Do not throw when constructing global objects, instead register the
        // exception to be processed later
        getMutableRegistryHub().registerStartupException();
    }
}

AutoReg::~AutoReg() = default;
}  // namespace Catch
// end catch_test_registry.cpp
// start catch_test_spec.cpp

#include <algorithm>
#include <memory>
#include <string>
#include <vector>

namespace Catch {

// Base pattern: stores the name passed in and exposes it through name().
TestSpec::Pattern::Pattern(std::string const &name) : m_name(name) {}

TestSpec::Pattern::~Pattern() = default;

// Returns the name this pattern was constructed with.
std::string const &TestSpec::Pattern::name() const { return m_name; }

// Matches test cases by name. `name` is lower-cased and compiled into a
// case-insensitive wildcard pattern; `filterString` becomes the pattern's
// reported name.
TestSpec::NamePattern::NamePattern(std::string const &name, std::string const &filterString)
        : Pattern(filterString), m_wildcardPattern(toLower(name), CaseSensitive::No) {}

// True when the test case's name satisfies the wildcard pattern.
bool TestSpec::NamePattern::matches(TestCaseInfo const &testCase) const {
    return m_wildcardPattern.matches(testCase.name);
}

// Matches test cases by tag. The tag is stored lower-cased; `filterString`
// becomes the pattern's reported name.
TestSpec::TagPattern::TagPattern(std::string const &tag, std::string const &filterString)
        : Pattern(filterString), m_tag(toLower(tag)) {}

// True when the stored tag is one of the test case's lower-cased tags.
bool TestSpec::TagPattern::matches(TestCaseInfo const &testCase) const {
    auto const &tags = testCase.lcaseTags;
    auto const last = end(tags);
    return std::find(begin(tags), last, m_tag) != last;
}

// Wraps another pattern and inverts its result. The wrapper reports the same
// name as the pattern it wraps.
TestSpec::ExcludedPattern::ExcludedPattern(PatternPtr const &underlyingPattern)
        : Pattern(underlyingPattern->name()), m_underlyingPattern(underlyingPattern) {}

// True exactly when the wrapped pattern does not match the test case.
bool TestSpec::ExcludedPattern::matches(TestCaseInfo const &testCase) const {
    return !m_underlyingPattern->matches(testCase);
}

// A filter matches only when every one of its patterns matches the test case;
// evaluation stops at the first pattern that does not. A filter without
// patterns matches everything.
bool TestSpec::Filter::matches(TestCaseInfo const &testCase) const {
    for (PatternPtr const &pattern : m_patterns) {
        if (!pattern->matches(testCase))
            return false;
    }
    return true;
}

// Builds the filter's name by concatenating the names of its patterns in
// order, with no separator.
std::string TestSpec::Filter::name() const {
    std::string combined;
    for (auto it = m_patterns.begin(); it != m_patterns.end(); ++it)
        combined.append((*it)->name());
    return combined;
}

// True when the spec holds at least one filter.
bool TestSpec::hasFilters() const { return !m_filters.empty(); }

// A test case matches the spec when at least one filter matches it;
// evaluation stops at the first matching filter. A spec without filters
// matches nothing.
bool TestSpec::matches(TestCaseInfo const &testCase) const {
    for (Filter const &filter : m_filters) {
        if (filter.matches(testCase))
            return true;
    }
    return false;
}

// Produces one FilterMatch per filter, in filter order. Each entry carries
// the filter's name and pointers to the test cases from `testCases` that pass
// isThrowSafe() for `config` and match the filter.
TestSpec::Matches TestSpec::matchesByFilter(std::vector<TestCase> const &testCases,
                                            IConfig const &config) const {
    Matches matches;
    matches.reserve(m_filters.size());

    for (Filter const &filter : m_filters) {
        std::vector<TestCase const *> selected;
        for (auto const &test : testCases) {
            if (isThrowSafe(test, config) && filter.matches(test))
                selected.emplace_back(&test);
        }
        matches.push_back(FilterMatch{filter.name(), selected});
    }
    return matches;
}

// Read-only access to the arguments recorded as invalid while parsing.
const TestSpec::vectorStrings &TestSpec::getInvalidArgs() const { return (m_invalidArgs); }

}  // namespace Catch
// end catch_test_spec.cpp
// start catch_test_spec_parser.cpp

namespace Catch {

// Keeps a pointer to the tag alias registry, which parse() uses to expand
// aliases; the registry must outlive the parser.
TestSpecParser::TestSpecParser(ITagAliasRegistry const &tagAliases) : m_tagAliases(&tagAliases) {}

// Parses one test-spec argument. Parser state is reset, tag aliases in `arg`
// are expanded, and the expanded text is fed to visitChar() one character at
// a time. If visitChar() reports failure, the original `arg` is recorded in
// m_testSpec.m_invalidArgs and scanning stops. The mode still pending at the
// end is closed with endMode(). Returns *this so calls can be chained.
TestSpecParser &TestSpecParser::parse(std::string const &arg) {
    m_mode = None;
    m_exclusion = false;
    m_arg = m_tagAliases->expandAliases(arg);
    m_escapeChars.clear();
    m_substring.reserve(m_arg.size());
    m_patternName.reserve(m_arg.size());
    m_realPatternPos = 0;

    for (m_pos = 0; m_pos < m_arg.size(); ++m_pos)
        // visitChar returned false: remember the offending argument and stop
        if (!visitChar(m_arg[m_pos])) {
            m_testSpec.m_invalidArgs.push_back(arg);
            break;
        }
    endMode();
    return *this;
}
// Flushes the filter currently being built (if it has any patterns) into the
// spec and returns a copy of the spec.
TestSpec TestSpecParser::testSpec() {
    addFilter();
    return m_testSpec;
}
// Processes one character of the argument according to the current mode.
// The only path that can return false is the ',' handling, which returns
// whatever separate() returns; every other path returns true.
bool TestSpecParser::visitChar(char c) {
    // Outside of an escape, a backslash starts one and a comma separates
    // filters.
    if ((m_mode != EscapedName) && (c == '\\')) {
        escape();
        addCharToPattern(c);
        return true;
    } else if ((m_mode != EscapedName) && (c == ',')) {
        return separate();
    }

    switch (m_mode) {
    case None:
        if (processNoneChar(c))
            return true;
        break;
    case Name:
        processNameChar(c);
        break;
    case EscapedName:
        // The character following a backslash ends the escape and is added
        // to the pattern.
        endMode();
        addCharToPattern(c);
        return true;
    default:
    case Tag:
    case QuotedName:
        if (processOtherChar(c))
            return true;
        break;
    }

    // The character always goes into the raw substring; it goes into the
    // pattern name only when it is not a control character for the mode that
    // is current at this point.
    m_substring += c;
    if (!isControlChar(c)) {
        m_patternName += c;
        m_realPatternPos++;
    }
    return true;
}
// Two of the processing methods return true to signal the caller to return
// without adding the given character to the current pattern strings
bool TestSpecParser::processNoneChar(char c) {
    switch (c) {
    case ' ':
        return true;
    case '~':
        m_exclusion = true;
        return false;
    case '[':
        startNewMode(Tag);
        return false;
    case '"':
        startNewMode(QuotedName);
        return false;
    default:
        startNewMode(Name);
        return false;
    }
}
// Handles a character seen inside a plain name. Only '[' is special: it
// switches to tag mode. If the text so far is exactly "exclude:" the
// exclusion flag is set; otherwise the current name is closed first.
void TestSpecParser::processNameChar(char c) {
    if (c != '[')
        return;

    if (m_substring == "exclude:") {
        m_exclusion = true;
    } else {
        endMode();
    }
    startNewMode(Tag);
}
// Handles a character seen in the remaining modes (tag, quoted name). A
// control character for the current mode is appended to the raw substring,
// ends the mode and returns true. Any other character returns false.
bool TestSpecParser::processOtherChar(char c) {
    if (isControlChar(c)) {
        m_substring += c;
        endMode();
        return true;
    }
    return false;
}
// Switches the parser to `mode`.
void TestSpecParser::startNewMode(Mode mode) { m_mode = mode; }

// Finishes whatever the current mode was collecting: names and quoted names
// become a name pattern, tags become a tag pattern, an escape restores the
// mode saved before it, and anything else resets the mode to None.
void TestSpecParser::endMode() {
    switch (m_mode) {
    case Name:
    case QuotedName:
        addNamePattern();
        break;
    case Tag:
        addTagPattern();
        break;
    case EscapedName:
        revertBackToLastMode();
        break;
    case None:
    default:
        startNewMode(None);
        break;
    }
}
// Enters escape mode: remembers the current mode so it can be restored,
// switches to EscapedName and records the current pattern position in
// m_escapeChars.
void TestSpecParser::escape() {
    saveLastMode();
    m_mode = EscapedName;
    m_escapeChars.push_back(m_realPatternPos);
}
// Tells whether `c` is a control character in the current mode:
// '~' in None, '[' in Name, '"' in QuotedName, '[' or ']' in Tag, and every
// character in EscapedName. Unrecognised modes have no control characters.
bool TestSpecParser::isControlChar(char c) const {
    switch (m_mode) {
    case None:
        return c == '~';
    case Name:
        return c == '[';
    case QuotedName:
        return c == '"';
    case Tag:
        return c == '[' || c == ']';
    case EscapedName:
        return true;
    default:
        return false;
    }
}

// Moves the filter under construction into the spec and starts a fresh one.
// A filter without patterns is not added.
void TestSpecParser::addFilter() {
    if (m_currentFilter.m_patterns.empty())
        return;

    m_testSpec.m_filters.push_back(m_currentFilter);
    m_currentFilter = TestSpec::Filter();
}

// Remembers the current mode in lastMode.
void TestSpecParser::saveLastMode() { lastMode = m_mode; }

// Restores the mode previously stored by saveLastMode().
void TestSpecParser::revertBackToLastMode() { m_mode = lastMode; }

// Handles a ',' separator. Inside a quoted name or a tag the separator makes
// the argument invalid: the parser state for the current pattern is reset,
// m_pos is moved to the end of the argument, and false is returned.
// Otherwise the current mode is ended, the current filter is added to the
// spec, and true is returned.
bool TestSpecParser::separate() {
    if ((m_mode == QuotedName) || (m_mode == Tag)) {
        // invalid argument, signal failure to previous scope.
        m_mode = None;
        m_pos = m_arg.size();
        m_substring.clear();
        m_patternName.clear();
        m_realPatternPos = 0;
        return false;
    }
    endMode();
    addFilter();
    return true;  // success
}

// Produces the final token for the pattern collected in m_patternName.
// One character is removed at each position recorded in m_escapeChars. A
// leading "exclude:" prefix is stripped and turns on the exclusion flag.
// m_escapeChars, m_patternName and m_realPatternPos are reset before
// returning.
std::string TestSpecParser::preprocessPattern() {
    std::string token = m_patternName;
    // Each earlier removal shifts later positions left by one, hence the "- i".
    for (std::size_t i = 0; i < m_escapeChars.size(); ++i)
        token = token.substr(0, m_escapeChars[i] - i) + token.substr(m_escapeChars[i] - i + 1);
    m_escapeChars.clear();
    if (startsWith(token, "exclude:")) {
        m_exclusion = true;
        token = token.substr(8);  // 8 == length of "exclude:"
    }

    m_patternName.clear();
    m_realPatternPos = 0;

    return token;
}

// Turns the collected text into a name pattern and appends it to the current
// filter, wrapped in an ExcludedPattern when exclusion is active. An empty
// token adds nothing. In every case the raw substring and the exclusion flag
// are cleared and the mode returns to None.
void TestSpecParser::addNamePattern() {
    auto token = preprocessPattern();

    if (!token.empty()) {
        TestSpec::PatternPtr pattern = std::make_shared<TestSpec::NamePattern>(token, m_substring);
        if (m_exclusion)
            pattern = std::make_shared<TestSpec::ExcludedPattern>(pattern);
        m_currentFilter.m_patterns.push_back(pattern);
    }
    m_substring.clear();
    m_exclusion = false;
    m_mode = None;
}

// Turns the collected text into one or two tag patterns and appends them to
// the current filter, each wrapped in an ExcludedPattern when exclusion is
// active. An empty token adds nothing. In every case the raw substring and
// the exclusion flag are cleared and the mode returns to None.
void TestSpecParser::addTagPattern() {
    auto token = preprocessPattern();

    if (!token.empty()) {
        // If the tag pattern is the "hide and tag" shorthand (e.g. [.foo])
        // we have to create a separate hide tag and shorten the real one
        if (token.size() > 1 && token[0] == '.') {
            token.erase(token.begin());
            TestSpec::PatternPtr pattern = std::make_shared<TestSpec::TagPattern>(".", m_substring);
            if (m_exclusion) {
                pattern = std::make_shared<TestSpec::ExcludedPattern>(pattern);
            }
            m_currentFilter.m_patterns.push_back(pattern);
        }

        // The tag itself (with the leading '.' already removed, if any).
        TestSpec::PatternPtr pattern = std::make_shared<TestSpec::TagPattern>(token, m_substring);

        if (m_exclusion) {
            pattern = std::make_shared<TestSpec::ExcludedPattern>(pattern);
        }
        m_currentFilter.m_patterns.push_back(pattern);
    }
    m_substring.clear();
    m_exclusion = false;
    m_mode = None;
}

// Convenience wrapper: parses `arg` with a temporary parser that uses the
// tag alias registry from ITagAliasRegistry::get(), and returns the
// resulting spec.
TestSpec parseTestSpec(std::string const &arg) {
    return TestSpecParser(ITagAliasRegistry::get()).parse(arg).testSpec();
}

}  // namespace Catch
// end catch_test_spec_parser.cpp
// start catch_timer.cpp

#include <chrono>

static const uint64_t nanosecondsInSecond = 1000000000;

namespace Catch {

// Reads std::chrono::high_resolution_clock and returns the time elapsed
// since that clock's epoch, in nanoseconds.
auto getCurrentNanosecondsSinceEpoch() -> uint64_t {
    using Clock = std::chrono::high_resolution_clock;
    auto const sinceEpoch = Clock::now().time_since_epoch();
    return std::chrono::duration_cast<std::chrono::nanoseconds>(sinceEpoch).count();
}

namespace {
// Estimates the clock resolution in nanoseconds. It repeatedly spins until
// the value returned by getCurrentNanosecondsSinceEpoch() changes, and
// averages the observed steps. Up to `iterations` samples are taken; sampling
// is cut short once more than three seconds have elapsed since the start.
auto estimateClockResolution() -> uint64_t {
    uint64_t sum = 0;
    static const uint64_t iterations = 1000000;

    auto startTime = getCurrentNanosecondsSinceEpoch();

    for (std::size_t i = 0; i < iterations; ++i) {
        uint64_t ticks;
        uint64_t baseTicks = getCurrentNanosecondsSinceEpoch();
        // Busy-wait until the clock reports a different value.
        do {
            ticks = getCurrentNanosecondsSinceEpoch();
        } while (ticks == baseTicks);

        auto delta = ticks - baseTicks;
        sum += delta;

        // If we have been calibrating for over 3 seconds -- the clock
        // is terrible and we should move on.
        // TBD: How to signal that the measured resolution is probably wrong?
        if (ticks > startTime + 3 * nanosecondsInSecond) {
            // Mean over the i + 1 samples collected so far.
            return sum / (i + 1u);
        }
    }

    // We're just taking the mean, here. To do better we could take the std. dev
    // and exclude outliers
    // - and potentially do more iterations if there's a high variance.
    return sum / iterations;
}
}  // namespace
// Returns the estimated clock resolution. The estimate is computed on the
// first call and cached in a function-local static for later calls.
auto getEstimatedClockResolution() -> uint64_t {
    static auto s_resolution = estimateClockResolution();
    return s_resolution;
}

// Records the current time (in nanoseconds) as the timer's starting point.
void Timer::start() { m_nanoseconds = getCurrentNanosecondsSinceEpoch(); }
// Nanoseconds elapsed since the recorded starting point.
auto Timer::getElapsedNanoseconds() const -> uint64_t {
    return getCurrentNanosecondsSinceEpoch() - m_nanoseconds;
}
// Elapsed time in whole microseconds (integer division truncates).
auto Timer::getElapsedMicroseconds() const -> uint64_t { return getElapsedNanoseconds() / 1000; }
// Elapsed time in whole milliseconds, narrowed to unsigned int.
auto Timer::getElapsedMilliseconds() const -> unsigned int {
    return static_cast<unsigned int>(getElapsedMicroseconds() / 1000);
}
// Elapsed time in seconds, derived from the whole-microsecond count.
auto Timer::getElapsedSeconds() const -> double { return getElapsedMicroseconds() / 1000000.0; }

}  // namespace Catch
// end catch_timer.cpp
// start catch_tostring.cpp

#if defined(__clang__)
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wexit-time-destructors"
#pragma clang diagnostic ignored "-Wglobal-constructors"
#endif

// Enable specific decls locally
#if !defined(CATCH_CONFIG_ENABLE_CHRONO_STRINGMAKER)
#define CATCH_CONFIG_ENABLE_CHRONO_STRINGMAKER
#endif

#include <cmath>
#include <iomanip>

namespace Catch {

namespace Detail {

const std::string unprintableString = "{?}";

namespace {
const int hexThreshold = 255;

// Run-time probe for the byte order of the host.
struct Endianness {
    enum Arch { Big, Little };

    // Inspects the byte at the lowest address of an int holding 1: a non-zero
    // byte there means the least significant byte comes first (Little).
    static Arch which() {
        int probe = 1;
        char const lowestAddressByte = *reinterpret_cast<char *>(&probe);
        if (lowestAddressByte != 0)
            return Little;
        return Big;
    }
};
}  // namespace

// Renders the `size` bytes starting at `object` as a "0x"-prefixed hex
// string, two zero-padded hex digits per byte. On little-endian hosts the
// bytes are written from the highest address down to the lowest; on
// big-endian hosts they are written in address order.
std::string rawMemoryToString(const void *object, std::size_t size) {
    // Reverse order for little endian architectures
    int i = 0, end = static_cast<int>(size), inc = 1;
    if (Endianness::which() == Endianness::Little) {
        i = end - 1;
        end = inc = -1;
    }

    unsigned char const *bytes = static_cast<unsigned char const *>(object);
    ReusableStringStream rss;
    rss << "0x" << std::setfill('0') << std::hex;
    for (; i != end; i += inc)
        rss << std::setw(2) << static_cast<unsigned>(bytes[i]);
    return rss.str();
}
}  // namespace Detail

// Formats a floating point `value` in fixed notation with `precision`
// fractional digits, then strips redundant trailing zeros while keeping at
// least one digit after the decimal point (e.g. "1.50000" -> "1.5",
// "2.00000" -> "2.0"). NaN is rendered as "nan".
//
// With a precision of 0 the fixed representation has no fractional part, so
// the text is returned untouched: its trailing zeros are significant
// (stripping them would turn "100" into "1").
template <typename T>
std::string fpToString(T value, int precision) {
    if (Catch::isnan(value)) {
        return "nan";
    }

    ReusableStringStream rss;
    rss << std::setprecision(precision) << std::fixed << value;
    std::string d = rss.str();

    // No fractional digits were requested: nothing may be trimmed.
    if (precision == 0) {
        return d;
    }

    std::size_t i = d.find_last_not_of('0');
    if (i != std::string::npos && i != d.size() - 1) {
        // Keep a single zero after the decimal point.
        if (d[i] == '.')
            i++;
        d = d.substr(0, i + 1);
    }
    return d;
}

//// ======================================================= ////
//
//   Out-of-line defs for full specialization of StringMaker
//
//// ======================================================= ////

// Wraps `str` in double quotes. When the active config asks for invisible
// characters to be shown, newlines and tabs are written as the two-character
// sequences \n and \t; all other characters are copied unchanged.
std::string StringMaker<std::string>::convert(const std::string &str) {
    bool const showInvisibles = getCurrentContext().getConfig()->showInvisibles();
    if (!showInvisibles) {
        return '"' + str + '"';
    }

    std::string quoted("\"");
    for (char ch : str) {
        if (ch == '\n') {
            quoted.append("\\n");
        } else if (ch == '\t') {
            quoted.append("\\t");
        } else {
            quoted.push_back(ch);
        }
    }
    quoted.append("\"");
    return quoted;
}

#ifdef CATCH_CONFIG_CPP17_STRING_VIEW
// Copies the view into a std::string and stringifies that.
std::string StringMaker<std::string_view>::convert(std::string_view str) {
    return ::Catch::Detail::stringify(std::string{str});
}
#endif

// Stringifies a C string as a std::string; a null pointer is rendered as
// "{null string}".
std::string StringMaker<char const *>::convert(char const *str) {
    if (!str) {
        return std::string("{null string}");
    }
    return ::Catch::Detail::stringify(std::string{str});
}
// Same as the const overload, for mutable C strings.
std::string StringMaker<char *>::convert(char *str) {
    if (!str) {
        return std::string("{null string}");
    }
    return ::Catch::Detail::stringify(std::string{str});
}

#ifdef CATCH_CONFIG_WCHAR
// Narrows a wide string to a std::string and stringifies the result.
// Characters with a value of at most 0xff are cast to char; anything larger
// is replaced by '?'.
std::string StringMaker<std::wstring>::convert(const std::wstring &wstr) {
    std::string s;
    s.reserve(wstr.size());
    for (auto c : wstr) {
        s += (c <= 0xff) ? static_cast<char>(c) : '?';
    }
    return ::Catch::Detail::stringify(s);
}

#ifdef CATCH_CONFIG_CPP17_STRING_VIEW
// Copies the view into a std::wstring and reuses the std::wstring conversion.
std::string StringMaker<std::wstring_view>::convert(std::wstring_view str) {
    return StringMaker<std::wstring>::convert(std::wstring(str));
}
#endif

// Stringifies a wide C string as a std::wstring; a null pointer is rendered
// as "{null string}".
std::string StringMaker<wchar_t const *>::convert(wchar_t const *str) {
    if (!str) {
        return std::string("{null string}");
    }
    return ::Catch::Detail::stringify(std::wstring{str});
}
// Same as the const overload, for mutable wide C strings.
std::string StringMaker<wchar_t *>::convert(wchar_t *str) {
    if (!str) {
        return std::string("{null string}");
    }
    return ::Catch::Detail::stringify(std::wstring{str});
}
#endif

#if defined(CATCH_CONFIG_CPP17_BYTE)
#include <cstddef>
// Stringifies a std::byte through its unsigned long long integer value.
std::string StringMaker<std::byte>::convert(std::byte value) {
    return ::Catch::Detail::stringify(std::to_integer<unsigned long long>(value));
}
#endif  // defined(CATCH_CONFIG_CPP17_BYTE)

// int and long are widened to long long and stringified as such.
std::string StringMaker<int>::convert(int value) {
    return ::Catch::Detail::stringify(static_cast<long long>(value));
}
std::string StringMaker<long>::convert(long value) {
    return ::Catch::Detail::stringify(static_cast<long long>(value));
}
// Writes the value in decimal; values above Detail::hexThreshold are followed
// by the hexadecimal form in parentheses, e.g. "256 (0x100)".
std::string StringMaker<long long>::convert(long long value) {
    ReusableStringStream rss;
    rss << value;
    if (value > Detail::hexThreshold) {
        rss << " (0x" << std::hex << value << ')';
    }
    return rss.str();
}

// unsigned int and unsigned long are widened to unsigned long long and
// stringified as such.
std::string StringMaker<unsigned int>::convert(unsigned int value) {
    return ::Catch::Detail::stringify(static_cast<unsigned long long>(value));
}
std::string StringMaker<unsigned long>::convert(unsigned long value) {
    return ::Catch::Detail::stringify(static_cast<unsigned long long>(value));
}
// Writes the value in decimal; values above Detail::hexThreshold are followed
// by the hexadecimal form in parentheses.
std::string StringMaker<unsigned long long>::convert(unsigned long long value) {
    ReusableStringStream rss;
    rss << value;
    if (value > Detail::hexThreshold) {
        rss << " (0x" << std::hex << value << ')';
    }
    return rss.str();
}

// Renders a bool as the text "true" or "false".
std::string StringMaker<bool>::convert(bool b) { return b ? "true" : "false"; }

// Renders a character in single quotes. Carriage return, form feed, newline
// and tab are shown as their escape sequences; the remaining values in the
// range ['\0', ' ') are shown as numbers instead.
std::string StringMaker<signed char>::convert(signed char value) {
    switch (value) {
    case '\r':
        return "'\\r'";
    case '\f':
        return "'\\f'";
    case '\n':
        return "'\\n'";
    case '\t':
        return "'\\t'";
    default:
        break;
    }

    if ('\0' <= value && value < ' ') {
        return ::Catch::Detail::stringify(static_cast<unsigned int>(value));
    }

    // Substitute the character into the middle of a quoted template.
    char quoted[] = "' '";
    quoted[1] = value;
    return quoted;
}
// char is stringified as a signed char.
std::string StringMaker<char>::convert(char c) {
    return ::Catch::Detail::stringify(static_cast<signed char>(c));
}
// unsigned char is cast to char and stringified as such.
std::string StringMaker<unsigned char>::convert(unsigned char c) {
    return ::Catch::Detail::stringify(static_cast<char>(c));
}

// A null pointer literal is always rendered as the text "nullptr".
std::string StringMaker<std::nullptr_t>::convert(std::nullptr_t) { return "nullptr"; }

// Number of fractional digits used when printing floats (initially 5).
int StringMaker<float>::precision = 5;

// Formats a float via fpToString() with the precision above and appends an
// 'f' suffix.
std::string StringMaker<float>::convert(float value) { return fpToString(value, precision) + 'f'; }

// Number of fractional digits used when printing doubles (initially 10).
int StringMaker<double>::precision = 10;

// Formats a double via fpToString() with the precision above.
std::string StringMaker<double>::convert(double value) { return fpToString(value, precision); }

// One-letter symbols returned for the std::ratio prefixes atto through
// milli. Micro is written as the ASCII letter "u".
std::string ratio_string<std::atto>::symbol() { return "a"; }
std::string ratio_string<std::femto>::symbol() { return "f"; }
std::string ratio_string<std::pico>::symbol() { return "p"; }
std::string ratio_string<std::nano>::symbol() { return "n"; }
std::string ratio_string<std::micro>::symbol() { return "u"; }
std::string ratio_string<std::milli>::symbol() { return "m"; }

}  // end namespace Catch

#if defined(__clang__)
#pragma clang diagnostic pop
#endif

// end catch_tostring.cpp
// start catch_totals.cpp

namespace Catch {

// Field-wise difference of the passed, failed and failedButOk counters.
Counts Counts::operator-(Counts const &other) const {
    Counts diff;
    diff.passed = passed - other.passed;
    diff.failed = failed - other.failed;
    diff.failedButOk = failedButOk - other.failedButOk;
    return diff;
}

// Adds the other counters to this one field by field and returns *this.
Counts &Counts::operator+=(Counts const &other) {
    passed += other.passed;
    failed += other.failed;
    failedButOk += other.failedButOk;
    return *this;
}

// Sum of all three counters.
std::size_t Counts::total() const { return passed + failed + failedButOk; }
// True when nothing failed, including failures that were marked as ok.
bool Counts::allPassed() const { return failed == 0 && failedButOk == 0; }
// True when there are no failures; failures marked as ok are tolerated.
bool Counts::allOk() const { return failed == 0; }

// Difference of the assertion counts and of the test case counts.
Totals Totals::operator-(Totals const &other) const {
    Totals diff;
    diff.assertions = assertions - other.assertions;
    diff.testCases = testCases - other.testCases;
    return diff;
}

// Accumulates the other totals' assertion and test case counts into this
// object and returns *this.
Totals &Totals::operator+=(Totals const &other) {
    assertions += other.assertions;
    testCases += other.testCases;
    return *this;
}

// Returns the change relative to `prevTotals`, with exactly one test case
// counter incremented on top of the plain difference. Which one depends on
// the assertion changes: `failed` if any assertion failed, otherwise
// `failedButOk` if any failed-but-ok assertion occurred, otherwise `passed`.
Totals Totals::delta(Totals const &prevTotals) const {
    Totals diff = *this - prevTotals;
    if (diff.assertions.failed > 0)
        ++diff.testCases.failed;
    else if (diff.assertions.failedButOk > 0)
        ++diff.testCases.failedButOk;
    else
        ++diff.testCases.passed;
    return diff;
}

}  // namespace Catch
// end catch_totals.cpp
// start catch_uncaught_exceptions.cpp

// start catch_config_uncaught_exceptions.hpp

//              Copyright Catch2 Authors
// Distributed under the Boost Software License, Version 1.0.
//   (See accompanying file LICENSE_1_0.txt or copy at
//        https://www.boost.org/LICENSE_1_0.txt)

// SPDX-License-Identifier: BSL-1.0

#ifndef CATCH_CONFIG_UNCAUGHT_EXCEPTIONS_HPP
#define CATCH_CONFIG_UNCAUGHT_EXCEPTIONS_HPP

// Detection step 1: decide from the MSVC compiler version.
#if defined(_MSC_VER)
#if _MSC_VER >= 1900  // Visual Studio 2015 or newer
#define CATCH_INTERNAL_CONFIG_CPP17_UNCAUGHT_EXCEPTIONS
#endif
#endif

#include <exception>

// Detection step 2: decide from the library feature-test macro, unless step 1
// already set the internal flag.
#if defined(__cpp_lib_uncaught_exceptions) && \
        !defined(CATCH_INTERNAL_CONFIG_CPP17_UNCAUGHT_EXCEPTIONS)

#define CATCH_INTERNAL_CONFIG_CPP17_UNCAUGHT_EXCEPTIONS
#endif  // __cpp_lib_uncaught_exceptions

// Promote the detected capability to the public configuration macro unless
// the user disabled it with CATCH_CONFIG_NO_CPP17_UNCAUGHT_EXCEPTIONS or has
// already defined it.
#if defined(CATCH_INTERNAL_CONFIG_CPP17_UNCAUGHT_EXCEPTIONS) && \
        !defined(CATCH_CONFIG_NO_CPP17_UNCAUGHT_EXCEPTIONS) &&  \
        !defined(CATCH_CONFIG_CPP17_UNCAUGHT_EXCEPTIONS)

#define CATCH_CONFIG_CPP17_UNCAUGHT_EXCEPTIONS
#endif

#endif  // CATCH_CONFIG_UNCAUGHT_EXCEPTIONS_HPP
// end catch_config_uncaught_exceptions.hpp
#include <exception>

namespace Catch {
// Reports whether an exception is currently in flight. The implementation
// is chosen at compile time: it always returns false when exceptions are
// disabled, otherwise it uses std::uncaught_exceptions() when that is
// configured as available, and falls back to std::uncaught_exception().
bool uncaught_exceptions() {
#if defined(CATCH_CONFIG_DISABLE_EXCEPTIONS)
    return false;
#elif defined(CATCH_CONFIG_CPP17_UNCAUGHT_EXCEPTIONS)
    return std::uncaught_exceptions() > 0;
#else
    return std::uncaught_exception();
#endif
}
}  // end namespace Catch
// end catch_uncaught_exceptions.cpp
// start catch_version.cpp

#include <ostream>

namespace Catch {

// Stores the version components as given. The branch name pointer is kept
// as-is (not copied), so the pointed-to string must outlive the Version.
Version::Version(unsigned int _majorVersion,
                 unsigned int _minorVersion,
                 unsigned int _patchNumber,
                 char const *const _branchName,
                 unsigned int _buildNumber)
        : majorVersion(_majorVersion),
          minorVersion(_minorVersion),
          patchNumber(_patchNumber),
          branchName(_branchName),
          buildNumber(_buildNumber) {}

// Writes "major.minor.patch", followed by "-branch.build" when the branch
// name is non-empty. Returns the stream.
std::ostream &operator<<(std::ostream &os, Version const &version) {
    os << version.majorVersion << '.';
    os << version.minorVersion << '.';
    os << version.patchNumber;

    // branchName is never null -> 0th char is \0 if it is empty
    bool const hasBranch = version.branchName[0] != '\0';
    if (hasBranch) {
        os << '-' << version.branchName;
        os << '.' << version.buildNumber;
    }
    return os;
}

// Returns the library version (2.13.7, no branch name, build number 0), held
// in a function-local static.
Version const &libraryVersion() {
    static Version version(2, 13, 7, "", 0);
    return version;
}

}  // namespace Catch
// end catch_version.cpp
// start catch_wildcard_pattern.cpp

namespace Catch {

// Builds a pattern from `pattern` after normalising it (see
// normaliseString()). A leading '*' and a trailing '*' are stripped from the
// stored pattern and recorded in m_wildcard instead.
// NOTE(review): m_wildcard's initial value is set outside this block;
// presumably NoWildcard - confirm against the class definition.
WildcardPattern::WildcardPattern(std::string const &pattern, CaseSensitive::Choice caseSensitivity)
        : m_caseSensitivity(caseSensitivity), m_pattern(normaliseString(pattern)) {
    if (startsWith(m_pattern, '*')) {
        m_pattern = m_pattern.substr(1);
        m_wildcard = WildcardAtStart;
    }
    if (endsWith(m_pattern, '*')) {
        m_pattern = m_pattern.substr(0, m_pattern.size() - 1);
        // Combine with a possible WildcardAtStart flag.
        m_wildcard = static_cast<WildcardPosition>(m_wildcard | WildcardAtEnd);
    }
}

// Tests the normalised `str` against the stored pattern. Depending on where
// wildcards were found the comparison is: exact equality (none), suffix
// match (wildcard at start), prefix match (wildcard at end) or substring
// match (wildcards at both ends).
bool WildcardPattern::matches(std::string const &str) const {
    switch (m_wildcard) {
    case NoWildcard:
        return m_pattern == normaliseString(str);
    case WildcardAtStart:
        return endsWith(normaliseString(str), m_pattern);
    case WildcardAtEnd:
        return startsWith(normaliseString(str), m_pattern);
    case WildcardAtBothEnds:
        return contains(normaliseString(str), m_pattern);
    default:
        CATCH_INTERNAL_ERROR("Unknown enum");
    }
}

// Trims `str`, lower-casing it first when the pattern is case-insensitive.
std::string WildcardPattern::normaliseString(std::string const &str) const {
    return trim(m_caseSensitivity == CaseSensitive::No ? toLower(str) : str);
}
}  // namespace Catch
// end catch_wildcard_pattern.cpp
// start catch_xmlwriter.cpp

#include <iomanip>
#include <type_traits>

namespace Catch {

namespace {

// Classifies a UTF-8 lead byte by its high bits and returns 2 for 110xxxxx,
// 3 for 1110xxxx and 4 for 11110xxx. Any other byte is reported through
// CATCH_INTERNAL_ERROR.
// NOTE(review): the caller's bounds check (idx + encBytes - 1) suggests the
// result is the total length of the sequence including the lead byte, not
// only the continuation bytes - confirm before relying on the name.
size_t trailingBytes(unsigned char c) {
    if ((c & 0xE0) == 0xC0) {
        return 2;
    }
    if ((c & 0xF0) == 0xE0) {
        return 3;
    }
    if ((c & 0xF8) == 0xF0) {
        return 4;
    }
    CATCH_INTERNAL_ERROR("Invalid multibyte utf-8 start byte encountered");
}

// Extracts the payload bits of a UTF-8 lead byte: the low 5 bits for
// 110xxxxx, the low 4 bits for 1110xxxx and the low 3 bits for 11110xxx.
// Any other byte is reported through CATCH_INTERNAL_ERROR.
uint32_t headerValue(unsigned char c) {
    if ((c & 0xE0) == 0xC0) {
        return c & 0x1F;
    }
    if ((c & 0xF0) == 0xE0) {
        return c & 0x0F;
    }
    if ((c & 0xF8) == 0xF0) {
        return c & 0x07;
    }
    CATCH_INTERNAL_ERROR("Invalid multibyte utf-8 start byte encountered");
}

// Writes `c` to `os` as "\x" followed by two upper-case hex digits. The
// stream's format flags are saved beforehand and restored afterwards.
void hexEscapeChar(std::ostream &os, unsigned char c) {
    std::ios_base::fmtflags const savedFlags = os.flags();

    os << "\\x";
    os << std::uppercase << std::hex << std::setfill('0') << std::setw(2);
    os << static_cast<int>(c);

    os.flags(savedFlags);
}

// True when the Newline bit is set in `fmt`.
bool shouldNewline(XmlFormatting fmt) {
    return !!(static_cast<std::underlying_type<XmlFormatting>::type>(fmt & XmlFormatting::Newline));
}

// True when the Indent bit is set in `fmt`.
bool shouldIndent(XmlFormatting fmt) {
    return !!(static_cast<std::underlying_type<XmlFormatting>::type>(fmt & XmlFormatting::Indent));
}

}  // anonymous namespace

// Bitwise OR of two XmlFormatting values, computed on the underlying integer
// type.
XmlFormatting operator|(XmlFormatting lhs, XmlFormatting rhs) {
    using Bits = std::underlying_type<XmlFormatting>::type;
    return static_cast<XmlFormatting>(static_cast<Bits>(lhs) | static_cast<Bits>(rhs));
}

// Bitwise AND of two XmlFormatting values, computed on the underlying integer
// type.
XmlFormatting operator&(XmlFormatting lhs, XmlFormatting rhs) {
    using Bits = std::underlying_type<XmlFormatting>::type;
    return static_cast<XmlFormatting>(static_cast<Bits>(lhs) & static_cast<Bits>(rhs));
}

// Stores the text to encode and the context (`forWhat`) it is encoded for.
XmlEncode::XmlEncode(std::string const &str, ForWhat forWhat) : m_str(str), m_forWhat(forWhat) {}

// Writes m_str to `os` with XML-significant characters escaped.
//
//  * '<' and '&' are always replaced by entities.
//  * '>' is replaced only when it terminates a "]]>" sequence.
//  * '"' is replaced only when encoding for attributes.
//  * ASCII control characters (other than 0x09-0x0D) and 0x7F are written as
//    "\xNN" hex escapes.
//  * Bytes >= 0x80 are passed through when they form a structurally valid
//    UTF-8 sequence; otherwise the offending lead byte is hex-escaped and
//    scanning resumes at the following byte.
void XmlEncode::encodeTo(std::ostream &os) const {
    // Apostrophe escaping not necessary if we always use " to write attributes
    // (see: http://www.w3.org/TR/xml/#syntax)

    for (std::size_t idx = 0; idx < m_str.size(); ++idx) {
        unsigned char c = m_str[idx];
        switch (c) {
        case '<':
            os << "&lt;";
            break;
        case '&':
            os << "&amp;";
            break;

        case '>':
            // See: http://www.w3.org/TR/xml/#syntax
            // "]]>" must not appear literally in character data. The '>' of
            // such a sequence sits at index 2 when the sequence starts the
            // string, so the check has to include idx == 2.
            if (idx >= 2 && m_str[idx - 1] == ']' && m_str[idx - 2] == ']')
                os << "&gt;";
            else
                os << c;
            break;

        case '\"':
            if (m_forWhat == ForAttributes)
                os << "&quot;";
            else
                os << c;
            break;

        default:
            // Check for control characters and invalid utf-8

            // Escape control characters in standard ascii
            // see
            // http://stackoverflow.com/questions/404107/why-are-control-characters-illegal-in-xml-1-0
            // NOTE(review): 0x0B and 0x0C fall in the pass-through range here
            // although XML 1.0 only permits 0x09, 0x0A and 0x0D; left as-is to
            // keep existing output stable.
            if (c < 0x09 || (c > 0x0D && c < 0x20) || c == 0x7F) {
                hexEscapeChar(os, c);
                break;
            }

            // Plain ASCII: Write it to stream
            if (c < 0x7F) {
                os << c;
                break;
            }

            // UTF-8 territory
            // Check if the encoding is valid and if it is not, hex escape bytes.
            // Important: We do not check the exact decoded values for validity,
            // only the encoding format.
            // First check that this byte is a valid lead byte:
            // This means that it is not encoded as 1111 1XXX
            // Or as 10XX XXXX
            if (c < 0xC0 || c >= 0xF8) {
                hexEscapeChar(os, c);
                break;
            }

            // Length of the whole sequence, lead byte included.
            auto encBytes = trailingBytes(c);
            // Are there enough bytes left to avoid accessing out-of-bounds memory?
            if (idx + encBytes - 1 >= m_str.size()) {
                hexEscapeChar(os, c);
                break;
            }
            // The header is valid, check data
            // The next encBytes - 1 bytes must together be a valid utf-8
            // This means: bitpattern 10XX XXXX and the extracted value is sane (ish)
            bool valid = true;
            uint32_t value = headerValue(c);
            for (std::size_t n = 1; n < encBytes; ++n) {
                unsigned char nc = m_str[idx + n];
                valid &= ((nc & 0xC0) == 0x80);
                value = (value << 6) | (nc & 0x3F);
            }

            if (
                    // Wrong bit pattern of following bytes
                    (!valid) ||
                    // Overlong encodings: the value would have fitted in a
                    // shorter sequence. U+0800 is the first code point that
                    // needs three bytes, so the third range starts at 0x800
                    // inclusive.
                    (value < 0x80) || (0x80 <= value && value < 0x800 && encBytes > 2) ||
                    (0x800 <= value && value < 0x10000 && encBytes > 3) ||
                    // Encoded value out of range
                    (value >= 0x110000)) {
                hexEscapeChar(os, c);
                break;
            }

            // If we got here, this is in fact a valid(ish) utf-8 sequence
            for (std::size_t n = 0; n < encBytes; ++n) {
                os << m_str[idx + n];
            }
            // Skip the continuation bytes just written; the loop's ++idx
            // accounts for the lead byte.
            idx += encBytes - 1;
            break;
        }
    }
}

// Stream insertion for XmlEncode: writes the escaped form of the wrapped
// string via encodeTo() and returns the stream for chaining.
std::ostream &operator<<(std::ostream &os, XmlEncode const &xmlEncode) {
    xmlEncode.encodeTo(os);
    return os;
}

// Binds the guard to `writer` and remembers the formatting that the
// destructor will pass to endElement().
XmlWriter::ScopedElement::ScopedElement(XmlWriter *writer, XmlFormatting fmt)
        : m_writer(writer), m_fmt(fmt) {}

// Move constructor: takes over the writer pointer and formatting from `other`
// and detaches `other` (null writer, XmlFormatting::None) so that its
// destructor does not close the element.
XmlWriter::ScopedElement::ScopedElement(ScopedElement &&other) noexcept
        : m_writer(other.m_writer), m_fmt(other.m_fmt) {
    other.m_writer = nullptr;
    other.m_fmt = XmlFormatting::None;
}
// Move assignment: closes the element this guard currently owns (if any),
// then takes over the writer pointer and formatting from `other`, leaving
// `other` detached (null writer, XmlFormatting::None).
XmlWriter::ScopedElement &XmlWriter::ScopedElement::operator=(ScopedElement &&other) noexcept {
    if (m_writer) {
        // Close with the formatting this guard was created with, exactly as
        // the destructor does, rather than with endElement()'s default.
        m_writer->endElement(m_fmt);
    }
    m_writer = other.m_writer;
    other.m_writer = nullptr;
    m_fmt = other.m_fmt;
    other.m_fmt = XmlFormatting::None;
    return *this;
}

// Closes the guarded element with the stored formatting, unless this guard
// has been detached (null writer).
XmlWriter::ScopedElement::~ScopedElement() {
    if (m_writer == nullptr) {
        return;
    }
    m_writer->endElement(m_fmt);
}

// Forwards `text` and `fmt` to the underlying writer's writeText() and returns
// this guard for chaining. m_writer is dereferenced without a null check.
XmlWriter::ScopedElement &XmlWriter::ScopedElement::writeText(std::string const &text,
                                                              XmlFormatting fmt) {
    m_writer->writeText(text, fmt);
    return *this;
}

// Binds the writer to `os` and immediately emits the XML declaration line.
XmlWriter::XmlWriter(std::ostream &os) : m_os(os) { writeDeclaration(); }

// Closes every element still on the tag stack (innermost first), then emits
// any newline that is still pending.
XmlWriter::~XmlWriter() {
    while (!m_tags.empty()) {
        endElement();
    }
    newlineIfNecessary();
}

// Opens a new element called `name`. Any start tag still open is terminated
// first and a pending newline is flushed. With the Indent flag set, the
// current indent is written and then deepened by two spaces. The start tag is
// left open (no '>') so that attributes can follow.
XmlWriter &XmlWriter::startElement(std::string const &name, XmlFormatting fmt) {
    ensureTagClosed();
    newlineIfNecessary();

    const bool indentRequested = shouldIndent(fmt);
    if (indentRequested) {
        m_os << m_indent;
        m_indent += "  ";
    }

    m_os << '<';
    m_os << name;

    m_tags.push_back(name);
    m_tagIsOpen = true;
    applyFormatting(fmt);
    return *this;
}

// Opens element `name` and returns a guard that closes it (with the same
// `fmt`) when the guard is destroyed.
XmlWriter::ScopedElement XmlWriter::scopedElement(std::string const &name, XmlFormatting fmt) {
    // The guard is created before the element is started.
    ScopedElement scoped(this, fmt);
    startElement(name, fmt);
    return scoped;
}

// Closes the most recently opened element. If its start tag is still open it
// is written as a self-closing tag ("/>"); otherwise a matching "</name>" is
// emitted, preceded by a pending newline and (with Indent) the indentation.
// The stream is flushed and the tag is popped from the stack.
XmlWriter &XmlWriter::endElement(XmlFormatting fmt) {
    // Drop one indentation level (two characters). An indent shorter than two
    // characters is left untouched.
    if (m_indent.size() >= 2) {
        m_indent.resize(m_indent.size() - 2);
    }

    if (!m_tagIsOpen) {
        newlineIfNecessary();
        if (shouldIndent(fmt)) {
            m_os << m_indent;
        }
        m_os << "</" << m_tags.back() << ">";
    } else {
        m_os << "/>";
        m_tagIsOpen = false;
    }

    m_os << std::flush;
    applyFormatting(fmt);
    m_tags.pop_back();
    return *this;
}

// Writes ` name="value"` with the value XML-escaped for attribute context.
// Nothing is written when either the name or the value is empty.
XmlWriter &XmlWriter::writeAttribute(std::string const &name, std::string const &attribute) {
    if (name.empty() || attribute.empty()) {
        return *this;
    }
    m_os << ' ' << name << "=\"";
    m_os << XmlEncode(attribute, XmlEncode::ForAttributes);
    m_os << '"';
    return *this;
}

// Writes ` name="true"` or ` name="false"`. Unlike the string overload, the
// name is not checked for emptiness.
XmlWriter &XmlWriter::writeAttribute(std::string const &name, bool attribute) {
    const char *const literal = attribute ? "true" : "false";
    m_os << ' ' << name << "=\"" << literal << '"';
    return *this;
}

// Writes `text` as XML-escaped character data. Empty text is a no-op. An open
// start tag is terminated first; the indent is written only if a tag was open
// on entry and the Indent flag is set.
XmlWriter &XmlWriter::writeText(std::string const &text, XmlFormatting fmt) {
    if (text.empty()) {
        return *this;
    }

    const bool hadOpenTag = m_tagIsOpen;
    ensureTagClosed();
    if (hadOpenTag && shouldIndent(fmt)) {
        m_os << m_indent;
    }

    m_os << XmlEncode(text);
    applyFormatting(fmt);
    return *this;
}

// Writes `text` as an XML comment ("<!--text-->"), after terminating any open
// start tag and, with the Indent flag, writing the current indent.
// The text is written verbatim; it is not escaped or checked here.
XmlWriter &XmlWriter::writeComment(std::string const &text, XmlFormatting fmt) {
    ensureTagClosed();
    if (shouldIndent(fmt)) {
        m_os << m_indent;
    }
    m_os << "<!--" << text << "-->";
    applyFormatting(fmt);
    return *this;
}

// Emits an xml-stylesheet processing instruction of type "text/xsl" pointing
// at `url`, followed by a newline. The URL is written verbatim (not escaped).
void XmlWriter::writeStylesheetRef(std::string const &url) {
    m_os << "<?xml-stylesheet type=\"text/xsl\" href=\"" << url << "\"?>\n";
}

// Terminates any open start tag and writes a single '\n'.
XmlWriter &XmlWriter::writeBlankLine() {
    ensureTagClosed();
    m_os << '\n';
    return *this;
}

// If a start tag is still open, terminates it with '>', flushes the stream,
// emits a pending newline and marks the tag as closed. Otherwise does nothing.
void XmlWriter::ensureTagClosed() {
    if (!m_tagIsOpen) {
        return;
    }
    m_os << '>' << std::flush;
    newlineIfNecessary();
    m_tagIsOpen = false;
}

// Records whether a newline is owed before the next piece of output, based on
// the Newline flag in `fmt`.
void XmlWriter::applyFormatting(XmlFormatting fmt) { m_needsNewline = shouldNewline(fmt); }

// Writes the XML 1.0 / UTF-8 declaration line.
void XmlWriter::writeDeclaration() { m_os << "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n"; }

// Emits the newline owed from a previous applyFormatting() call (using
// std::endl, so the stream is flushed too) and clears the pending flag.
void XmlWriter::newlineIfNecessary() {
    if (!m_needsNewline) {
        return;
    }
    m_os << std::endl;
    m_needsNewline = false;
}
}  // namespace Catch
// end catch_xmlwriter.cpp
// start catch_reporter_bases.cpp

#include <cassert>
#include <cfloat>
#include <cstdio>
#include <cstring>
#include <memory>

namespace Catch {
// Calls getExpandedExpression() on `result` and discards the returned value.
// NOTE(review): presumably this forces the expansion to be computed and cached
// inside the result -- confirm against AssertionResult.
void prepareExpandedExpression(AssertionResult &result) { result.getExpandedExpression(); }

// Formats `duration` in fixed notation with exactly three decimal places.
//
// Formatting with C++ streams is stateful, so we drop down to C-style
// formatting here. A stringstream would also work, but its performance is...
// not good.
std::string getFormattedDuration(double duration) {
    // 1 for a possible minus sign
    // + (max exponent + 1) digits to represent the whole part
    // + 1 for decimal point
    // + 3 for the 3 decimal places
    // + 1 for null terminator
    const std::size_t maxDoubleSize = 1 + DBL_MAX_10_EXP + 1 + 1 + 3 + 1;
    char buffer[maxDoubleSize];
    // Guarantee a terminated (empty) string even if formatting fails.
    buffer[0] = '\0';

    // Save previous errno, to prevent the formatting call from overwriting it
    ErrnoGuard guard;
#ifdef _MSC_VER
    sprintf_s(buffer, "%.3f", duration);
#else
    // Bounded write: never stores more than maxDoubleSize bytes, terminator
    // included.
    std::snprintf(buffer, maxDoubleSize, "%.3f", duration);
#endif
    return std::string(buffer);
}

// Decides whether a duration should be reported. ShowDurations::Always and
// ShowDurations::Never are absolute; for any other setting the duration is
// shown when the configured minimum is non-negative and `duration` reaches it.
bool shouldShowDuration(IConfig const &config, double duration) {
    if (config.showDurations() == ShowDurations::Always) {
        return true;
    } else if (config.showDurations() == ShowDurations::Never) {
        return false;
    }

    const double threshold = config.minDuration();
    const bool thresholdEnabled = threshold >= 0;
    return thresholdEnabled && duration >= threshold;
}

std::string serializeFilters(std::vector<std::string> const &container) {
    ReusableStringStream oss;
    bool first = true;
    for (auto &&filter : container) {
        if (!first)
            oss << ' ';
        else
            first = false;

        oss << filter;
    }
    return oss.str();
}

// Forwards the reporter configuration to StreamingReporterBase.
TestEventListenerBase::TestEventListenerBase(ReporterConfig const &_config)
        : StreamingReporterBase(_config) {}

// Reports Quiet, Normal and High as the supported verbosity levels.
std::set<Verbosity> TestEventListenerBase::getSupportedVerbosities() {
    return {Verbosity::Quiet, Verbosity::Normal, Verbosity::High};
}

// Default no-op implementation.
void TestEventListenerBase::assertionStarting(AssertionInfo const &) {}

// Default implementation: ignores the assertion and returns false.
bool TestEventListenerBase::assertionEnded(AssertionStats const &) { return false; }

}  // end namespace Catch
// end catch_reporter_bases.cpp
// start catch_reporter_compact.cpp

namespace {

// Labels used by the compact reporter for failed / passed assertions.
// When CATCH_PLATFORM_MAC is defined the upper-case spellings are used,
// otherwise the lower-case ones.
#ifdef CATCH_PLATFORM_MAC
const char *failedString() { return "FAILED"; }
const char *passedString() { return "PASSED"; }
#else
const char *failedString() { return "failed"; }
const char *passedString() { return "passed"; }
#endif

// Colour used by the compact reporter for de-emphasised text.
// Returns Colour::FileName (the original note here read "Colour::LightGrey";
// presumably FileName maps to that shade -- confirm against Colour::Code).
Catch::Colour::Code dimColour() { return Catch::Colour::FileName; }

// Quantifier prefix for a count: empty for exactly 1, "both " for exactly 2,
// and "all " for every other count (including 0).
std::string bothOrAll(std::size_t count) {
    if (count == 1) {
        return std::string();
    }
    if (count == 2) {
        return "both ";
    }
    return "all ";
}

}  // namespace

namespace Catch {
namespace {
// Writes the one-line run summary to `out`.
// Colour, message variants:
// - white: No tests ran.
// -   red: Failed [both/all] N test cases, failed [both/all] M assertions.
// - white: Passed [both/all] N test cases (no assertions).
// -   red: Failed N test cases, failed M assertions.
// - green: Passed [both/all] N test cases with M assertions.
void printTotals(std::ostream &out, const Totals &totals) {
    const auto &cases = totals.testCases;
    const auto &checks = totals.assertions;

    // Nothing ran at all.
    if (cases.total() == 0) {
        out << "No tests ran.";
        return;
    }

    // Every test case failed.
    if (cases.failed == cases.total()) {
        Colour colour(Colour::ResultError);
        // The assertion count gets a "both"/"all" qualifier only when every
        // assertion failed as well.
        std::string assertionQualifier;
        if (checks.failed == checks.total()) {
            assertionQualifier = bothOrAll(checks.failed);
        }
        out << "Failed " << bothOrAll(cases.failed) << pluralise(cases.failed, "test case");
        out << ", failed " << assertionQualifier << pluralise(checks.failed, "assertion") << '.';
        return;
    }

    // Test cases ran but contained no assertions.
    if (checks.total() == 0) {
        out << "Passed " << bothOrAll(cases.total()) << pluralise(cases.total(), "test case")
            << " (no assertions).";
        return;
    }

    // Some, but not all, test cases failed.
    if (checks.failed) {
        Colour colour(Colour::ResultError);
        out << "Failed " << pluralise(cases.failed, "test case");
        out << ", failed " << pluralise(checks.failed, "assertion") << '.';
        return;
    }

    // Everything passed.
    Colour colour(Colour::ResultSuccess);
    out << "Passed " << bothOrAll(cases.passed) << pluralise(cases.passed, "test case");
    out << " with " << pluralise(checks.passed, "assertion") << '.';
}

// Implementation of CompactReporter formatting
class AssertionPrinter {
public:
    AssertionPrinter &operator=(AssertionPrinter const &) = delete;
    AssertionPrinter(AssertionPrinter const &) = delete;
    AssertionPrinter(std::ostream &_stream, AssertionStats const &_stats, bool _printInfoMessages)
            : stream(_stream),
              result(_stats.assertionResult),
              messages(_stats.infoMessages),
              itMessage(_stats.infoMessages.begin()),
              printInfoMessages(_printInfoMessages) {}

    void print() {
        printSourceInfo();

        itMessage = messages.begin();

        switch (result.getResultType()) {
        case ResultWas::Ok:
            printResultType(Colour::ResultSuccess, passedString());
            printOriginalExpression();
            printReconstructedExpression();
            if (!result.hasExpression())
                printRemainingMessages(Colour::None);
            else
                printRemainingMessages();
            break;
        case ResultWas::ExpressionFailed:
            if (result.isOk())
                printResultType(Colour::ResultSuccess,
                                failedString() + std::string(" - but was ok"));
            else
                printResultType(Colour::Error, failedString());
            printOriginalExpression();
            printReconstructedExpression();
            printRemainingMessages();
            break;
        case ResultWas::ThrewException:
            printResultType(Colour::Error, failedString());
            printIssue("unexpected exception with message:");
            printMessage();
            printExpressionWas();
            printRemainingMessages();
            break;
        case ResultWas::FatalErrorCondition:
            printResultType(Colour::Error, failedString());
            printIssue("fatal error condition with message:");
            printMessage();
            printExpressionWas();
            printRemainingMessages();
            break;
        case ResultWas::DidntThrowException:
            printResultType(Colour::Error, failedString());
            printIssue("expected exception, got none");
            printExpressionWas();
            printRemainingMessages();
            break;
        case ResultWas::Info:
            printResultType(Colour::None, "info");
            printMessage();
            printRemainingMessages();
            break;
        case ResultWas::Warning:
            printResultType(Colour::None, "warning");
            printMessage();
            printRemainingMessages();
            break;
        case ResultWas::ExplicitFailure:
            printResultType(Colour::Error, failedString());
            printIssue("explicitly");
            printRemainingMessages(Colour::None);
            break;
            // These cases are here to prevent compiler warnings
        case ResultWas::Unknown:
        case ResultWas::FailureBit:
        case ResultWas::Exception:
            printResultType(Colour::Error, "** internal error **");
            break;
        }
    }

private:
    void printSourceInfo() const {
        Colour colourGuard(Colour::FileName);
        stream << result.getSourceInfo() << ':';
    }

    void printResultType(Colour::Code colour, std::string const &passOrFail) const {
        if (!passOrFail.empty()) {
            {
                Colour colourGuard(colour);
                stream << ' ' << passOrFail;
            }
            stream << ':';
        }
    }

    void printIssue(std::string const &issue) const { stream << ' ' << issue; }

    void printExpressionWas() {
        if (result.hasExpression()) {
            stream << ';';
            {
                Colour colour(dimColour());
                stream << " expression was:";
            }
            printOriginalExpression();
        }
    }

    void printOriginalExpression() const {
        if (result.hasExpression()) {
            stream << ' ' << result.getExpression();
        }
    }

    void printReconstructedExpression() const {
        if (result.hasExpandedExpression()) {
            {
                Colour colour(dimColour());
                stream << " for: ";
            }
            stream << result.getExpandedExpression();
        }
    }

    void printMessage() {
        if (itMessage != messages.end()) {
            stream << " '" << itMessage->message << '\'';
            ++itMessage;
        }
    }

    void printRemainingMessages(Colour::Code colour = dimColour()) {
        if (itMessage == messages.end())
            return;

        const auto itEnd = messages.cend();
        const auto N = static_cast<std::size_t>(std::distance(itMessage, itEnd));

        {
            Colour colourGuard(colour);
            stream << " with " << pluralise(N, "message") << ':';
        }

        while (itMessage != itEnd) {
            // If this assertion is a warning ignore any INFO messages
            if (printInfoMessages || itMessage->type != ResultWas::Info) {
                printMessage();
                if (itMessage != itEnd) {
                    Colour colourGuard(dimColour());
                    stream << " and";
                }
                continue;
            }
            ++itMessage;
        }
    }

private:
    std::ostream &stream;
    AssertionResult const &result;
    std::vector<MessageInfo> messages;
    std::vector<MessageInfo>::const_iterator itMessage;
    bool printInfoMessages;
};

}  // namespace

// One-line human-readable description of this reporter.
std::string CompactReporter::getDescription() {
    return "Reports test results on a single line, suitable for IDEs";
}

// Reports that the test spec `spec` matched no test cases; the line is
// terminated with std::endl (and therefore flushed).
void CompactReporter::noMatchingTestCases(std::string const &spec) {
    stream << "No test cases matched '" << spec << '\'' << std::endl;
}

// Nothing is printed when an assertion starts.
void CompactReporter::assertionStarting(AssertionInfo const &) {}

// Prints one line for a finished assertion and returns true, or returns false
// without printing when the assertion was ok, successful results are not being
// reported, and it is not a warning. For a warning in that situation the line
// is printed but its Info messages are suppressed.
bool CompactReporter::assertionEnded(AssertionStats const &_assertionStats) {
    AssertionResult const &outcome = _assertionStats.assertionResult;

    // True when the result was successful and we're not printing those.
    const bool hiddenSuccess = !m_config->includeSuccessfulResults() && outcome.isOk();
    if (hiddenSuccess && outcome.getResultType() != ResultWas::Warning) {
        return false;
    }

    const bool printInfoMessages = !hiddenSuccess;
    AssertionPrinter printer(stream, _assertionStats, printInfoMessages);
    printer.print();

    stream << std::endl;
    return true;
}

// Prints "<seconds> s: <section name>" when the configuration asks for this
// section's duration to be shown.
void CompactReporter::sectionEnded(SectionStats const &_sectionStats) {
    const double seconds = _sectionStats.durationInSeconds;
    if (!shouldShowDuration(*m_config, seconds)) {
        return;
    }
    stream << getFormattedDuration(seconds) << " s: ";
    stream << _sectionStats.sectionInfo.name << std::endl;
}

// Prints the totals summary followed by a blank line, then hands over to the
// base-class implementation.
void CompactReporter::testRunEnded(TestRunStats const &_testRunStats) {
    printTotals(stream, _testRunStats.totals);
    stream << '\n' << std::endl;
    StreamingReporterBase::testRunEnded(_testRunStats);
}

// Out-of-line empty destructor.
CompactReporter::~CompactReporter() {}

CATCH_REGISTER_REPORTER("compact", CompactReporter)

}  // end namespace Catch
// end catch_reporter_compact.cpp
// start catch_reporter_console.cpp

#include <cfloat>
#include <cstdio>

#if defined(_MSC_VER)
#pragma warning(push)
#pragma warning(disable : 4061)  // Not all labels are EXPLICITLY handled in switch
// Note that 4062 (not all labels are handled and default is missing) is
// enabled
#endif

#if defined(__clang__)
#pragma clang diagnostic push
// For simplicity, benchmarking-only helpers are always enabled
#pragma clang diagnostic ignored "-Wunused-function"
#endif

namespace Catch {

namespace {

// Formatter impl for ConsoleReporter.
//
// The constructor derives the colour, the PASSED/FAILED label and the message
// label from the assertion's result type; print() then writes the multi-line
// report for that assertion to `stream`.
class ConsoleAssertionPrinter {
public:
    ConsoleAssertionPrinter &operator=(ConsoleAssertionPrinter const &) = delete;
    ConsoleAssertionPrinter(ConsoleAssertionPrinter const &) = delete;

    // _stream:            destination for the report
    // _stats:             assertion to render (held by reference; its info
    //                     messages are copied)
    // _printInfoMessages: when false, messages of type ResultWas::Info are
    //                     skipped by printMessage()
    ConsoleAssertionPrinter(std::ostream &_stream,
                            AssertionStats const &_stats,
                            bool _printInfoMessages)
            : stream(_stream),
              stats(_stats),
              result(_stats.assertionResult),
              colour(Colour::None),
              message(result.getMessage()),
              messages(_stats.infoMessages),
              printInfoMessages(_printInfoMessages) {
        switch (result.getResultType()) {
        case ResultWas::Ok:
            colour = Colour::Success;
            passOrFail = "PASSED";
            // if( result.hasMessage() )
            if (_stats.infoMessages.size() == 1)
                messageLabel = "with message";
            if (_stats.infoMessages.size() > 1)
                messageLabel = "with messages";
            break;
        case ResultWas::ExpressionFailed:
            if (result.isOk()) {
                colour = Colour::Success;
                passOrFail = "FAILED - but was ok";
            } else {
                colour = Colour::Error;
                passOrFail = "FAILED";
            }
            if (_stats.infoMessages.size() == 1)
                messageLabel = "with message";
            if (_stats.infoMessages.size() > 1)
                messageLabel = "with messages";
            break;
        case ResultWas::ThrewException:
            colour = Colour::Error;
            passOrFail = "FAILED";
            // NOTE(review): with zero info messages the label is left ending
            // in "with " and nothing is appended.
            messageLabel = "due to unexpected exception with ";
            if (_stats.infoMessages.size() == 1)
                messageLabel += "message";
            if (_stats.infoMessages.size() > 1)
                messageLabel += "messages";
            break;
        case ResultWas::FatalErrorCondition:
            colour = Colour::Error;
            passOrFail = "FAILED";
            messageLabel = "due to a fatal error condition";
            break;
        case ResultWas::DidntThrowException:
            colour = Colour::Error;
            passOrFail = "FAILED";
            messageLabel = "because no exception was thrown where one was expected";
            break;
        case ResultWas::Info:
            messageLabel = "info";
            break;
        case ResultWas::Warning:
            messageLabel = "warning";
            break;
        case ResultWas::ExplicitFailure:
            passOrFail = "FAILED";
            colour = Colour::Error;
            if (_stats.infoMessages.size() == 1)
                messageLabel = "explicitly with message";
            if (_stats.infoMessages.size() > 1)
                messageLabel = "explicitly with messages";
            break;
            // These cases are here to prevent compiler warnings
        case ResultWas::Unknown:
        case ResultWas::FailureBit:
        case ResultWas::Exception:
            passOrFail = "** internal error **";
            colour = Colour::Error;
            break;
        }
    }

    // Writes the report: source location, then (if any assertions were
    // counted) the result label and both expression forms, otherwise just a
    // newline; finally the message label and messages.
    void print() const {
        printSourceInfo();
        if (stats.totals.assertions.total() > 0) {
            printResultType();
            printOriginalExpression();
            printReconstructedExpression();
        } else {
            stream << '\n';
        }
        printMessage();
    }

private:
    // "<PASSED|FAILED...>:" in the result colour; nothing for an empty label.
    void printResultType() const {
        if (!passOrFail.empty()) {
            Colour colourGuard(colour);
            stream << passOrFail << ":\n";
        }
    }
    // The expression as written in the macro, indented by two spaces.
    void printOriginalExpression() const {
        if (result.hasExpression()) {
            Colour colourGuard(Colour::OriginalExpression);
            stream << "  ";
            stream << result.getExpressionInMacro();
            stream << '\n';
        }
    }
    // "with expansion:" followed by the expanded expression, indented by two.
    void printReconstructedExpression() const {
        if (result.hasExpandedExpression()) {
            stream << "with expansion:\n";
            Colour colourGuard(Colour::ReconstructedExpression);
            stream << Column(result.getExpandedExpression()).indent(2) << '\n';
        }
    }
    // The message label (if any) followed by each message on its own
    // indented line.
    void printMessage() const {
        if (!messageLabel.empty())
            stream << messageLabel << ':' << '\n';
        for (auto const &msg : messages) {
            // If this assertion is a warning ignore any INFO messages
            if (printInfoMessages || msg.type != ResultWas::Info)
                stream << Column(msg.message).indent(2) << '\n';
        }
    }
    // "<source info>: " in the file-name colour.
    void printSourceInfo() const {
        Colour colourGuard(Colour::FileName);
        stream << result.getSourceInfo() << ": ";
    }

    std::ostream &stream;
    AssertionStats const &stats;
    AssertionResult const &result;
    Colour::Code colour;
    std::string passOrFail;
    std::string messageLabel;
    // Initialised from result.getMessage(); not read by any method of this
    // class.
    std::string message;
    std::vector<MessageInfo> messages;
    bool printInfoMessages;
};

// Scales `number` out of `total` to a width of CATCH_CONFIG_CONSOLE_WIDTH
// columns (integer division). A non-zero `number` always yields at least 1;
// a zero `total` is treated as a ratio of 0 before that adjustment.
std::size_t makeRatio(std::size_t number, std::size_t total) {
    std::size_t scaled = 0;
    if (total > 0) {
        scaled = CATCH_CONFIG_CONSOLE_WIDTH * number / total;
    }
    if (scaled == 0 && number > 0) {
        return 1;
    }
    return scaled;
}

// Returns a reference to the largest of the three arguments. `i` is chosen
// only when strictly greater than both others; otherwise `j` is chosen when
// strictly greater than `k`; in all remaining cases (ties included) `k`.
std::size_t &findMax(std::size_t &i, std::size_t &j, std::size_t &k) {
    const bool firstIsStrictlyLargest = (i > j) && (i > k);
    if (firstIsStrictlyLargest) {
        return i;
    }
    return (j > k) ? j : k;
}

// Description of one table column as consumed by TablePrinter.
struct ColumnInfo {
    enum Justification { Left, Right };
    // Header text for the column.
    std::string name;
    // Column width in characters; TablePrinter pads cell text to width - 1
    // and appends one space.
    int width;
    // Side on which cell text is aligned.
    Justification justification;
};
// Tag type: streamed into a TablePrinter to end the current cell.
struct ColumnBreak {};
// Tag type: streamed into a TablePrinter to end the current row.
struct RowBreak {};

// A time span held in nanoseconds together with the unit it should be
// displayed in. With Unit::Auto (the default) the constructor picks the unit
// from the magnitude: ns below 1 us, us below 1 ms, ms below 1 s, s below
// 1 minute, minutes otherwise. Streaming prints "<value> <unit>".
class Duration {
    enum class Unit { Auto, Nanoseconds, Microseconds, Milliseconds, Seconds, Minutes };
    static const uint64_t s_nanosecondsInAMicrosecond = 1000;
    static const uint64_t s_nanosecondsInAMillisecond = 1000 * s_nanosecondsInAMicrosecond;
    static const uint64_t s_nanosecondsInASecond = 1000 * s_nanosecondsInAMillisecond;
    static const uint64_t s_nanosecondsInAMinute = 60 * s_nanosecondsInASecond;

    double m_inNanoseconds;
    Unit m_units;

    // Picks the display unit for a magnitude given in nanoseconds.
    static Unit chooseUnit(double nanoseconds) {
        if (nanoseconds < s_nanosecondsInAMicrosecond) {
            return Unit::Nanoseconds;
        }
        if (nanoseconds < s_nanosecondsInAMillisecond) {
            return Unit::Microseconds;
        }
        if (nanoseconds < s_nanosecondsInASecond) {
            return Unit::Milliseconds;
        }
        if (nanoseconds < s_nanosecondsInAMinute) {
            return Unit::Seconds;
        }
        return Unit::Minutes;
    }

public:
    explicit Duration(double inNanoseconds, Unit units = Unit::Auto)
            : m_inNanoseconds(inNanoseconds),
              m_units(units == Unit::Auto ? chooseUnit(inNanoseconds) : units) {}

    // The span converted to the display unit.
    auto value() const -> double {
        uint64_t nanosecondsPerUnit = 0;
        switch (m_units) {
        case Unit::Microseconds:
            nanosecondsPerUnit = s_nanosecondsInAMicrosecond;
            break;
        case Unit::Milliseconds:
            nanosecondsPerUnit = s_nanosecondsInAMillisecond;
            break;
        case Unit::Seconds:
            nanosecondsPerUnit = s_nanosecondsInASecond;
            break;
        case Unit::Minutes:
            nanosecondsPerUnit = s_nanosecondsInAMinute;
            break;
        default:
            // Nanoseconds (and anything unexpected): no conversion.
            return m_inNanoseconds;
        }
        return m_inNanoseconds / static_cast<double>(nanosecondsPerUnit);
    }

    // Short suffix for the display unit.
    auto unitsAsString() const -> std::string {
        if (m_units == Unit::Nanoseconds) {
            return "ns";
        }
        if (m_units == Unit::Microseconds) {
            return "us";
        }
        if (m_units == Unit::Milliseconds) {
            return "ms";
        }
        if (m_units == Unit::Seconds) {
            return "s";
        }
        if (m_units == Unit::Minutes) {
            return "m";
        }
        return "** internal error **";
    }

    friend auto operator<<(std::ostream &os, Duration const &duration) -> std::ostream & {
        os << duration.value();
        os << ' ' << duration.unitsAsString();
        return os;
    }
};
}  // namespace

// Writes a fixed-width table to an output stream.
//
// Cell text is accumulated in an internal buffer through the generic
// operator<<; streaming a ColumnBreak flushes the buffer as one padded cell
// and streaming a RowBreak ends the row. The header is printed when the table
// is first opened.
class TablePrinter {
    std::ostream &m_os;
    std::vector<ColumnInfo> m_columnInfos;
    // Buffer for the text of the cell currently being built.
    std::ostringstream m_oss;
    // Index of the column most recently written; -1 at the start of a row.
    int m_currentColumn = -1;
    bool m_isOpen = false;

public:
    TablePrinter(std::ostream &os, std::vector<ColumnInfo> columnInfos)
            : m_os(os), m_columnInfos(std::move(columnInfos)) {}

    auto columnInfos() const -> std::vector<ColumnInfo> const & { return m_columnInfos; }

    // Opens the table if it is not open yet: ends any row in progress, then
    // prints the column names (each laid out in width - 2 characters followed
    // by a 2-character spacer) and a line of '-' characters.
    void open() {
        if (!m_isOpen) {
            m_isOpen = true;
            *this << RowBreak();

            Columns headerCols;
            Spacer spacer(2);
            for (auto const &info : m_columnInfos) {
                headerCols += Column(info.name).width(static_cast<std::size_t>(info.width - 2));
                headerCols += spacer;
            }
            m_os << headerCols << '\n';

            m_os << Catch::getLineOfChars<'-'>() << '\n';
        }
    }
    // Closes the table if it is open: ends any row in progress and writes
    // std::endl.
    void close() {
        if (m_isOpen) {
            *this << RowBreak();
            m_os << std::endl;
            m_isOpen = false;
        }
    }

    // Appends `value` to the buffer of the cell under construction; nothing
    // reaches the output stream until a ColumnBreak is streamed.
    template <typename T>
    friend TablePrinter &operator<<(TablePrinter &tp, T const &value) {
        tp.m_oss << value;
        return tp;
    }

    // Flushes the buffered text as the next cell.
    friend TablePrinter &operator<<(TablePrinter &tp, ColumnBreak) {
        // Take the buffered text and clear the buffer before open() runs.
        auto colStr = tp.m_oss.str();
        const auto strSize = colStr.size();
        tp.m_oss.str("");
        tp.open();
        // The previous cell filled the last column: wrap to a new row.
        if (tp.m_currentColumn == static_cast<int>(tp.m_columnInfos.size() - 1)) {
            tp.m_currentColumn = -1;
            tp.m_os << '\n';
        }
        tp.m_currentColumn++;

        auto colInfo = tp.m_columnInfos[tp.m_currentColumn];
        // Pad to width - 1; the remaining character is the trailing space
        // written below. Text that is already too long gets no padding.
        auto padding = (strSize + 1 < static_cast<std::size_t>(colInfo.width))
                               ? std::string(colInfo.width - (strSize + 1), ' ')
                               : std::string();
        if (colInfo.justification == ColumnInfo::Left)
            tp.m_os << colStr << padding << ' ';
        else
            tp.m_os << padding << colStr << ' ';
        return tp;
    }

    // Ends the current row with a newline and resets the column index.
    // Only acts when the current column index is greater than 0.
    friend TablePrinter &operator<<(TablePrinter &tp, RowBreak) {
        if (tp.m_currentColumn > 0) {
            tp.m_os << '\n';
            tp.m_currentColumn = -1;
        }
        return tp;
    }
};

// Constructs the reporter and its benchmark table printer. The column layout
// is chosen once, here, by an immediately-invoked lambda: four columns in both
// cases, with simpler headers when benchmarkNoAnalysis() is set and
// three-line headers (samples/iterations/estimated over mean and std dev
// figures) otherwise.
ConsoleReporter::ConsoleReporter(ReporterConfig const &config)
        : StreamingReporterBase(config),
          m_tablePrinter(new TablePrinter(config.stream(), [&config]() -> std::vector<ColumnInfo> {
              if (config.fullConfig()->benchmarkNoAnalysis()) {
                  return {{"benchmark name", CATCH_CONFIG_CONSOLE_WIDTH - 43, ColumnInfo::Left},
                          {"     samples", 14, ColumnInfo::Right},
                          {"  iterations", 14, ColumnInfo::Right},
                          {"        mean", 14, ColumnInfo::Right}};
              } else {
                  return {{"benchmark name", CATCH_CONFIG_CONSOLE_WIDTH - 43, ColumnInfo::Left},
                          {"samples      mean       std dev", 14, ColumnInfo::Right},
                          {"iterations   low mean   low std dev", 14, ColumnInfo::Right},
                          {"estimated    high mean  high std dev", 14, ColumnInfo::Right}};
              }
          }())) {}
// Defaulted out of line, after TablePrinter's definition above.
// NOTE(review): presumably required because m_tablePrinter is a smart pointer
// to a type that is incomplete in the header -- confirm against the class
// declaration.
ConsoleReporter::~ConsoleReporter() = default;

// One-line human-readable description of this reporter.
std::string ConsoleReporter::getDescription() {
    return "Reports test results as plain lines of text";
}

// Reports that the test spec `spec` matched no test cases; the line is
// terminated with std::endl (and therefore flushed).
void ConsoleReporter::noMatchingTestCases(std::string const &spec) {
    stream << "No test cases matched '" << spec << '\'' << std::endl;
}

// Reports an invalid filter argument on its own line.
void ConsoleReporter::reportInvalidArguments(std::string const &arg) {
    stream << "Invalid Filter: " << arg << std::endl;
}

// Nothing is printed when an assertion starts.
void ConsoleReporter::assertionStarting(AssertionInfo const &) {}

// Prints the report for a finished assertion and returns true, or returns
// false without printing when the assertion was ok, successful results are not
// being reported, and it is not a warning. For a warning in that situation the
// report is printed but its Info messages are suppressed.
bool ConsoleReporter::assertionEnded(AssertionStats const &_assertionStats) {
    AssertionResult const &outcome = _assertionStats.assertionResult;

    // Results are shown in full for failures, and for successes when the
    // configuration asks for them.
    const bool showInFull = m_config->includeSuccessfulResults() || !outcome.isOk();
    const bool isWarning = outcome.getResultType() == ResultWas::Warning;

    // Drop out if result was successful but we're not printing them.
    if (!showInFull && !isWarning) {
        return false;
    }

    lazyPrint();

    ConsoleAssertionPrinter printer(stream, _assertionStats, showInFull);
    printer.print();
    stream << std::endl;
    return true;
}

// Closes any open benchmark table, clears the header-printed flag, then hands
// over to the base-class implementation.
void ConsoleReporter::sectionStarting(SectionInfo const &_sectionInfo) {
    m_tablePrinter->close();
    m_headerPrinted = false;
    StreamingReporterBase::sectionStarting(_sectionInfo);
}
// Handles the end of a section.
//
// Closes the table printer, reports a section (or test case) that contained
// no assertions, optionally prints the section duration, clears the "header
// printed" flag and finally forwards the event to the base class.
void ConsoleReporter::sectionEnded(SectionStats const &_sectionStats) {
    m_tablePrinter->close();

    auto const &sectionName = _sectionStats.sectionInfo.name;

    if (_sectionStats.missingAssertions) {
        lazyPrint();
        Colour colour(Colour::ResultError);
        // A stack deeper than one entry means we are inside a nested section
        // rather than at test-case level.
        char const *const complaint = (m_sectionStack.size() > 1)
                                              ? "\nNo assertions in section"
                                              : "\nNo assertions in test case";
        stream << complaint;
        stream << " '" << sectionName << "'\n" << std::endl;
    }

    double const elapsed = _sectionStats.durationInSeconds;
    if (shouldShowDuration(*m_config, elapsed))
        stream << getFormattedDuration(elapsed) << " s: " << sectionName << std::endl;

    // Whatever is printed next needs its header printed again.
    m_headerPrinted = false;

    StreamingReporterBase::sectionEnded(_sectionStats);
}

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// Starts the table row(s) for a benchmark by writing its name into the first
// column. The name is wrapped to the width of the first column minus two;
// every wrapped line after the first is preceded by three column breaks.
void ConsoleReporter::benchmarkPreparing(std::string const &name) {
    lazyPrintWithoutClosingBenchmarkTable();

    auto const nameWidth =
            static_cast<std::size_t>(m_tablePrinter->columnInfos()[0].width - 2);
    auto wrappedName = Column(name).width(nameWidth);

    bool isContinuation = false;
    for (auto textLine : wrappedName) {
        if (isContinuation)
            (*m_tablePrinter) << ColumnBreak() << ColumnBreak() << ColumnBreak();
        isContinuation = true;

        (*m_tablePrinter) << textLine << ColumnBreak();
    }
}

// Writes the sample count and iteration count of the benchmark into the
// table and, unless analysis is disabled, the estimated duration as well.
void ConsoleReporter::benchmarkStarting(BenchmarkInfo const &info) {
    auto &table = *m_tablePrinter;
    table << info.samples << ColumnBreak();
    table << info.iterations << ColumnBreak();

    if (m_config->benchmarkNoAnalysis())
        return;

    table << Duration(info.estimatedDuration) << ColumnBreak();
}
// Writes the results of a finished benchmark into the table.
//
// Without analysis only the mean point estimate is written. With analysis
// the mean (point, lower bound, upper bound) and the standard deviation
// (point, lower bound, upper bound) are written, separated and padded with
// column breaks.
void ConsoleReporter::benchmarkEnded(BenchmarkStats<> const &stats) {
    auto &table = *m_tablePrinter;

    if (m_config->benchmarkNoAnalysis()) {
        table << Duration(stats.mean.point.count()) << ColumnBreak();
        return;
    }

    auto const &mean = stats.mean;
    auto const &deviation = stats.standardDeviation;

    // Mean estimates, preceded by one column break.
    table << ColumnBreak() << Duration(mean.point.count()) << ColumnBreak()
          << Duration(mean.lower_bound.count()) << ColumnBreak()
          << Duration(mean.upper_bound.count()) << ColumnBreak();

    // Standard deviation estimates, again preceded by one column break.
    table << ColumnBreak() << Duration(deviation.point.count()) << ColumnBreak()
          << Duration(deviation.lower_bound.count()) << ColumnBreak()
          << Duration(deviation.upper_bound.count());

    // Five trailing column breaks.
    table << ColumnBreak() << ColumnBreak() << ColumnBreak() << ColumnBreak() << ColumnBreak();
}

// Writes a "Benchmark failed (<error>)" entry into the table, followed by a
// column break and a row break, while a red Colour guard is alive.
void ConsoleReporter::benchmarkFailed(std::string const &error) {
    Colour colour(Colour::Red);
    (*m_tablePrinter) << "Benchmark failed (" << error << ')' << ColumnBreak() << RowBreak();
}
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// Handles the end of a test case: closes the table printer, forwards the
// event to the base class and clears the "header printed" flag.
void ConsoleReporter::testCaseEnded(TestCaseStats const &_testCaseStats) {
    m_tablePrinter->close();
    StreamingReporterBase::testCaseEnded(_testCaseStats);
    m_headerPrinted = false;
}
// Handles the end of a test group. If the group info was marked as used,
// prints a divider, a "Summary for group" heading and the group totals.
// The event is always forwarded to the base class afterwards.
void ConsoleReporter::testGroupEnded(TestGroupStats const &_testGroupStats) {
    bool const groupWasAnnounced = currentGroupInfo.used;
    if (groupWasAnnounced) {
        printSummaryDivider();

        stream << "Summary for group '";
        stream << _testGroupStats.groupInfo.name;
        stream << "':\n";

        printTotals(_testGroupStats.totals);
        stream << '\n' << std::endl;
    }

    StreamingReporterBase::testGroupEnded(_testGroupStats);
}
// Handles the end of the whole test run: prints the totals divider and the
// totals, flushes the stream, then forwards the event to the base class.
void ConsoleReporter::testRunEnded(TestRunStats const &_testRunStats) {
    printTotalsDivider(_testRunStats.totals);
    printTotals(_testRunStats.totals);
    stream << std::endl;
    StreamingReporterBase::testRunEnded(_testRunStats);
}
// Handles the start of the test run: forwards the event to the base class,
// then prints the active test filters (if any).
void ConsoleReporter::testRunStarting(TestRunInfo const &_testInfo) {
    StreamingReporterBase::testRunStarting(_testInfo);
    printTestFilters();
}

// Closes the table printer and then prints any pending run/group/test-case
// headers that have not been printed yet.
void ConsoleReporter::lazyPrint() {
    m_tablePrinter->close();
    lazyPrintWithoutClosingBenchmarkTable();
}

// Prints the run info, the group info and the test case / section header,
// each only if it has not been printed before. Unlike lazyPrint() this does
// not close the table printer first.
void ConsoleReporter::lazyPrintWithoutClosingBenchmarkTable() {
    if (!currentTestRunInfo.used) {
        lazyPrintRunInfo();
    }
    if (!currentGroupInfo.used) {
        lazyPrintGroupInfo();
    }

    if (m_headerPrinted)
        return;

    printTestCaseAndSectionHeader();
    m_headerPrinted = true;
}
// Prints the run banner: a line of '~', the host application name with the
// Catch version, a usage hint and, when the RNG seed is non-zero, the seed.
// Marks the run info as used afterwards.
void ConsoleReporter::lazyPrintRunInfo() {
    stream << '\n';
    stream << getLineOfChars<'~'>() << '\n';

    Colour colour(Colour::SecondaryText);
    stream << currentTestRunInfo->name << " is a Catch v" << libraryVersion()
           << " host application.\n";
    stream << "Run with -? for options\n\n";

    bool const hasSeed = m_config->rngSeed() != 0;
    if (hasSeed) {
        stream << "Randomness seeded to: " << m_config->rngSeed() << "\n\n";
    }

    currentTestRunInfo.used = true;
}
// Prints a closed "Group: <name>" header and marks the group info as used,
// but only when the group has a name and there is more than one group.
void ConsoleReporter::lazyPrintGroupInfo() {
    if (currentGroupInfo->name.empty())
        return;
    if (currentGroupInfo->groupsCounts <= 1)
        return;

    printClosedHeader("Group: " + currentGroupInfo->name);
    currentGroupInfo.used = true;
}
void ConsoleReporter::printTestCaseAndSectionHeader() {
    assert(!m_sectionStack.empty());
    printOpenHeader(currentTestCaseInfo->name);

    if (m_sectionStack.size() > 1) {
        Colour colourGuard(Colour::Headers);

        auto it = m_sectionStack.begin() + 1,  // Skip first section (test case)
                itEnd = m_sectionStack.end();
        for (; it != itEnd; ++it)
            printHeaderString(it->name, 2);
    }

    SourceLineInfo lineInfo = m_sectionStack.back().lineInfo;

    stream << getLineOfChars<'-'>() << '\n';
    Colour colourGuard(Colour::FileName);
    stream << lineInfo << '\n';
    stream << getLineOfChars<'.'>() << '\n' << std::endl;
}

// Prints an open header for `_name` and closes it with a line of '.'.
void ConsoleReporter::printClosedHeader(std::string const &_name) {
    printOpenHeader(_name);
    stream << getLineOfChars<'.'>() << '\n';
}
// Prints a line of '-' followed by `_name` as a header string. The Colour
// guard is scoped to the braces so it only covers the header text.
void ConsoleReporter::printOpenHeader(std::string const &_name) {
    stream << getLineOfChars<'-'>() << '\n';
    {
        Colour colourGuard(Colour::Headers);
        printHeaderString(_name);
    }
}

// Prints `_string` as a wrapped column. The first line is indented by
// `indent`; if the string contains ": ", continuation lines are indented
// further so that they start just after the first ": ".
void ConsoleReporter::printHeaderString(std::string const &_string, std::size_t indent) {
    std::size_t const separator = _string.find(": ");
    std::size_t const hanging = (separator == std::string::npos) ? 0 : separator + 2;

    stream << Column(_string).indent(indent + hanging).initialIndent(indent) << '\n';
}

struct SummaryColumn {
    SummaryColumn(std::string _label, Colour::Code _colour)
            : label(std::move(_label)), colour(_colour) {}
    SummaryColumn addRow(std::size_t count) {
        ReusableStringStream rss;
        rss << count;
        std::string row = rss.str();
        for (auto &oldRow : rows) {
            while (oldRow.size() < row.size())
                oldRow = ' ' + oldRow;
            while (oldRow.size() > row.size())
                row = ' ' + row;
        }
        rows.push_back(row);
        return *this;
    }

    std::string label;
    Colour::Code colour;
    std::vector<std::string> rows;
};

// Prints the final totals.
//
// - No test cases at all: prints "No tests ran".
// - At least one assertion and every test case passed: prints a one-line
//   "All tests passed" summary.
// - Otherwise: prints a "test cases" row and an "assertions" row with
//   total / passed / failed / failed-as-expected columns.
void ConsoleReporter::printTotals(Totals const &totals) {
    if (totals.testCases.total() == 0) {
        stream << Colour(Colour::Warning) << "No tests ran\n";
        return;
    }

    if (totals.assertions.total() > 0 && totals.testCases.allPassed()) {
        // Kept as two statements: the Colour temporary only lives for the
        // first one.
        stream << Colour(Colour::ResultSuccess) << "All tests passed";
        stream << " (" << pluralise(totals.assertions.passed, "assertion") << " in "
               << pluralise(totals.testCases.passed, "test case") << ')' << '\n';
        return;
    }

    std::vector<SummaryColumn> columns;
    // Adds one column whose first row is the test-case count and whose
    // second row is the assertion count.
    auto addColumn = [&columns](char const *heading,
                                Colour::Code colour,
                                std::size_t caseCount,
                                std::size_t assertionCount) {
        columns.push_back(SummaryColumn(heading, colour).addRow(caseCount).addRow(assertionCount));
    };

    addColumn("", Colour::None, totals.testCases.total(), totals.assertions.total());
    addColumn("passed", Colour::Success, totals.testCases.passed, totals.assertions.passed);
    addColumn("failed", Colour::ResultError, totals.testCases.failed, totals.assertions.failed);
    addColumn("failed as expected", Colour::ResultExpectedFailure, totals.testCases.failedButOk,
              totals.assertions.failedButOk);

    printSummaryRow("test cases", columns, 0);
    printSummaryRow("assertions", columns, 1);
}
// Prints one line of the totals summary.
//
// `label` names the row, `cols` holds the summary columns and `row` selects
// which cell of every column is printed. The column with an empty label
// prints the row label followed by its value (or "- none -" when the value
// is "0"); every other column is printed only when its value is not "0".
void ConsoleReporter::printSummaryRow(std::string const &label,
                                      std::vector<SummaryColumn> const &cols,
                                      std::size_t row) {
    // Iterate by const reference: copying a SummaryColumn would duplicate its
    // label and every cell string just to read a single cell.
    for (auto const &col : cols) {
        std::string const &value = col.rows[row];
        if (col.label.empty()) {
            stream << label << ": ";
            if (value != "0")
                stream << value;
            else
                stream << Colour(Colour::Warning) << "- none -";
        } else if (value != "0") {
            // Separate statements so each Colour temporary covers only its
            // own piece of output.
            stream << Colour(Colour::LightGrey) << " | ";
            stream << Colour(col.colour) << value << ' ' << col.label;
        }
    }
    stream << '\n';
}

// Prints a divider line of '=' characters, CATCH_CONFIG_CONSOLE_WIDTH - 1
// wide. When test cases ran, the line is split into failed / failed-but-ok /
// passed segments sized from makeRatio(); otherwise it is a single segment
// in the warning colour.
void ConsoleReporter::printTotalsDivider(Totals const &totals) {
    auto const caseCount = totals.testCases.total();
    if (caseCount > 0) {
        std::size_t failedWidth = makeRatio(totals.testCases.failed, caseCount);
        std::size_t expectedFailWidth = makeRatio(totals.testCases.failedButOk, caseCount);
        std::size_t passedWidth = makeRatio(totals.testCases.passed, caseCount);

        auto usedWidth = [&] { return failedWidth + expectedFailWidth + passedWidth; };

        // Grow or shrink the largest segment until the three segments fill
        // the line exactly.
        while (usedWidth() < CATCH_CONFIG_CONSOLE_WIDTH - 1)
            findMax(failedWidth, expectedFailWidth, passedWidth)++;
        while (usedWidth() > CATCH_CONFIG_CONSOLE_WIDTH - 1)
            findMax(failedWidth, expectedFailWidth, passedWidth)--;

        stream << Colour(Colour::Error) << std::string(failedWidth, '=');
        stream << Colour(Colour::ResultExpectedFailure) << std::string(expectedFailWidth, '=');
        if (totals.testCases.allPassed()) {
            stream << Colour(Colour::ResultSuccess) << std::string(passedWidth, '=');
        } else {
            stream << Colour(Colour::Success) << std::string(passedWidth, '=');
        }
    } else {
        stream << Colour(Colour::Warning) << std::string(CATCH_CONFIG_CONSOLE_WIDTH - 1, '=');
    }
    stream << '\n';
}
// Prints a divider line of '-' characters followed by a newline.
void ConsoleReporter::printSummaryDivider() { stream << getLineOfChars<'-'>() << '\n'; }

// Prints a "Filters: ..." line listing the configured tests/tags, but only
// when the test spec has filters.
void ConsoleReporter::printTestFilters() {
    if (!m_config->testSpec().hasFilters())
        return;

    Colour guard(Colour::BrightYellow);
    stream << "Filters: ";
    stream << serializeFilters(m_config->getTestsOrTags()) << '\n';
}

CATCH_REGISTER_REPORTER("console", ConsoleReporter)

}  // end namespace Catch

#if defined(_MSC_VER)
#pragma warning(pop)
#endif

#if defined(__clang__)
#pragma clang diagnostic pop
#endif
// end catch_reporter_console.cpp
// start catch_reporter_junit.cpp

#include <algorithm>
#include <cassert>
#include <ctime>
#include <iomanip>
#include <sstream>

namespace Catch {

namespace {
// Returns the current time formatted as "YYYY-MM-DDTHH:MM:SSZ" (UTC).
std::string getCurrentTimestamp() {
    // Beware, this is not reentrant because of backward compatibility issues
    // Also, UTC only, again because of backward compatibility (%z is C++11)
    char const *const layout = "%Y-%m-%dT%H:%M:%SZ";
    // Size of a sample timestamp, including the terminating NUL.
    auto const bufferLen = sizeof("2017-01-16T17:06:45Z");
    char buffer[bufferLen];

    time_t now;
    std::time(&now);

#ifdef _MSC_VER
    std::tm utcStorage = {};
    gmtime_s(&utcStorage, &now);
    std::tm const *const utc = &utcStorage;
#else
    std::tm const *const utc = std::gmtime(&now);
#endif

    std::strftime(buffer, bufferLen, layout, utc);
    // Drop the terminating NUL from the returned string.
    return std::string(buffer, bufferLen - 1);
}

// Returns the first tag that starts with '#', with the '#' removed, or an
// empty string when no tag starts with '#'.
std::string fileNameTag(const std::vector<std::string> &tags) {
    auto it = std::find_if(begin(tags), end(tags), [](std::string const &tag) {
        // front() on an empty string is undefined behaviour, so check first.
        return !tag.empty() && tag.front() == '#';
    });
    if (it != tags.end())
        return it->substr(1);
    return std::string();
}

// Formats the duration in seconds to 3 decimal places.
// This is done because some genius defined Maven Surefire schema
// in a way that only accepts 3 decimal places, and tools like
// Jenkins use that schema for validation JUnit reporter output.
std::string formatDuration(double seconds) {
    ReusableStringStream rss;
    rss << std::fixed << std::setprecision(3) << seconds;
    return rss.str();
}

}  // anonymous namespace

// Constructs the reporter on top of CumulativeReporterBase, with the XML
// writer bound to the configured stream, and switches on the
// shouldRedirectStdOut and shouldReportAllAssertions preferences.
JunitReporter::JunitReporter(ReporterConfig const &_config)
        : CumulativeReporterBase(_config), xml(_config.stream()) {
    m_reporterPrefs.shouldRedirectStdOut = true;
    m_reporterPrefs.shouldReportAllAssertions = true;
}

// Empty destructor, defined out of line.
JunitReporter::~JunitReporter() {}

// Returns the fixed one-line description of this reporter.
std::string JunitReporter::getDescription() {
    return "Reports test results in an XML format that looks like Ant's "
           "junitreport target";
}

// Intentionally empty: unmatched test specs produce no JUnit output.
void JunitReporter::noMatchingTestCases(std::string const & /*spec*/) {}

// Forwards the event to the base class and opens the root <testsuites>
// element. The element is closed in testRunEndedCumulative().
void JunitReporter::testRunStarting(TestRunInfo const &runInfo) {
    CumulativeReporterBase::testRunStarting(runInfo);
    xml.startElement("testsuites");
}

// Resets the per-suite state (timer, captured stdout/stderr and the count
// of unexpected exceptions) and forwards the event to the base class.
void JunitReporter::testGroupStarting(GroupInfo const &groupInfo) {
    suiteTimer.start();
    stdOutForSuite.clear();
    stdErrForSuite.clear();
    unexpectedExceptions = 0;
    CumulativeReporterBase::testGroupStarting(groupInfo);
}

// Remembers whether the test case that is starting is allowed to fail;
// assertionEnded() reads this when counting unexpected exceptions.
void JunitReporter::testCaseStarting(TestCaseInfo const &testCaseInfo) {
    m_okToFail = testCaseInfo.okToFail();
}

// Counts assertions that ended with a thrown exception in a test case that
// is not allowed to fail, then forwards the event to the base class and
// returns its result.
bool JunitReporter::assertionEnded(AssertionStats const &assertionStats) {
    bool const threw =
            assertionStats.assertionResult.getResultType() == ResultWas::ThrewException;
    if (threw && !m_okToFail) {
        ++unexpectedExceptions;
    }
    return CumulativeReporterBase::assertionEnded(assertionStats);
}

// Appends the test case's captured stdout/stderr to the per-suite buffers
// and forwards the event to the base class.
void JunitReporter::testCaseEnded(TestCaseStats const &testCaseStats) {
    stdOutForSuite += testCaseStats.stdOut;
    stdErrForSuite += testCaseStats.stdErr;
    CumulativeReporterBase::testCaseEnded(testCaseStats);
}

// Reads the elapsed suite time, forwards the event to the base class and
// then writes the most recently recorded test group as a <testsuite>.
void JunitReporter::testGroupEnded(TestGroupStats const &testGroupStats) {
    // Sample the timer before the base class does its bookkeeping.
    double suiteTime = suiteTimer.getElapsedSeconds();
    CumulativeReporterBase::testGroupEnded(testGroupStats);
    writeGroup(*m_testGroups.back(), suiteTime);
}

// Closes the element that is currently open in the XML writer
// (the <testsuites> root opened in testRunStarting()).
void JunitReporter::testRunEndedCumulative() { xml.endElement(); }

// Writes one <testsuite> element for a test group.
//
// Attributes: name, errors (unexpected exceptions), failures (failed
// assertions minus unexpected exceptions), tests, hostname, time and
// timestamp. Then an optional <properties> element (filters, random seed),
// every test case of the group and finally the suite's captured
// stdout/stderr.
void JunitReporter::writeGroup(TestGroupNode const &groupNode, double suiteTime) {
    XmlWriter::ScopedElement suiteElement = xml.scopedElement("testsuite");

    TestGroupStats const &groupStats = groupNode.value;
    auto const &assertionCounts = groupStats.totals.assertions;

    xml.writeAttribute("name", groupStats.groupInfo.name);
    xml.writeAttribute("errors", unexpectedExceptions);
    xml.writeAttribute("failures", assertionCounts.failed - unexpectedExceptions);
    xml.writeAttribute("tests", assertionCounts.total());
    xml.writeAttribute("hostname", "tbd");  // !TBD

    // The time attribute is always present, but left empty when durations
    // are never to be shown.
    if (m_config->showDurations() != ShowDurations::Never) {
        xml.writeAttribute("time", formatDuration(suiteTime));
    } else {
        xml.writeAttribute("time", "");
    }
    xml.writeAttribute("timestamp", getCurrentTimestamp());

    // Write properties if there are any
    if (m_config->hasTestFilters() || m_config->rngSeed() != 0) {
        auto propertiesElement = xml.scopedElement("properties");

        if (m_config->hasTestFilters()) {
            xml.scopedElement("property")
                    .writeAttribute("name", "filters")
                    .writeAttribute("value", serializeFilters(m_config->getTestsOrTags()));
        }

        if (m_config->rngSeed() != 0) {
            xml.scopedElement("property")
                    .writeAttribute("name", "random-seed")
                    .writeAttribute("value", m_config->rngSeed());
        }
    }

    // Write test cases
    for (auto const &testCase : groupNode.children) {
        writeTestCase(*testCase);
    }

    xml.scopedElement("system-out").writeText(trim(stdOutForSuite), XmlFormatting::Newline);
    xml.scopedElement("system-err").writeText(trim(stdErrForSuite), XmlFormatting::Newline);
}

// Writes a test case by writing its root section.
//
// The class name is, in order of preference: the test's own class name, the
// first '#'-prefixed tag (without the '#'), or "global". When the run has a
// name it is prepended as "<run name>.".
void JunitReporter::writeTestCase(TestCaseNode const &testCaseNode) {
    TestCaseStats const &caseStats = testCaseNode.value;
    auto const &info = caseStats.testInfo;

    // All test cases have exactly one section - which represents the
    // test case itself. That section may have 0-n nested sections
    assert(testCaseNode.children.size() == 1);
    SectionNode const &rootSection = *testCaseNode.children.front();

    std::string suiteClass = info.className;
    if (suiteClass.empty())
        suiteClass = fileNameTag(info.tags);
    if (suiteClass.empty())
        suiteClass = "global";

    if (!m_config->name().empty()) {
        suiteClass = m_config->name() + "." + suiteClass;
    }

    writeSection(suiteClass, "", rootSection, info.okToFail());
}

// Writes a section, and recursively its child sections, as <testcase>
// elements.
//
// `className` is the JUnit class name (may be empty), `rootName` is the
// '/'-joined path of the enclosing sections (may be empty), `sectionNode` is
// the section to write and `testOkToFail` is passed on unchanged to child
// sections. A <testcase> element is only written when the section has
// assertions or captured output.
void JunitReporter::writeSection(std::string const &className,
                                 std::string const &rootName,
                                 SectionNode const &sectionNode,
                                 bool testOkToFail) {
    std::string qualifiedName = trim(sectionNode.stats.sectionInfo.name);
    if (!rootName.empty())
        qualifiedName = rootName + '/' + qualifiedName;

    bool const hasClass = !className.empty();
    bool const hasContent = !sectionNode.assertions.empty() || !sectionNode.stdOut.empty() ||
                            !sectionNode.stdErr.empty();

    if (hasContent) {
        XmlWriter::ScopedElement testCaseElement = xml.scopedElement("testcase");
        if (hasClass) {
            xml.writeAttribute("classname", className);
            xml.writeAttribute("name", qualifiedName);
        } else {
            // Without a class name the section name takes its place.
            xml.writeAttribute("classname", qualifiedName);
            xml.writeAttribute("name", "root");
        }
        xml.writeAttribute("time", formatDuration(sectionNode.stats.durationInSeconds));
        // This is not ideal, but it should be enough to mimic gtest's
        // junit output.
        // Ideally the JUnit reporter would also handle `skipTest`
        // events and write those out appropriately.
        xml.writeAttribute("status", "run");

        if (sectionNode.stats.assertions.failedButOk) {
            xml.scopedElement("skipped").writeAttribute("message",
                                                        "TEST_CASE tagged with !mayfail");
        }

        writeAssertions(sectionNode);

        if (!sectionNode.stdOut.empty()) {
            xml.scopedElement("system-out")
                    .writeText(trim(sectionNode.stdOut), XmlFormatting::Newline);
        }
        if (!sectionNode.stdErr.empty()) {
            xml.scopedElement("system-err")
                    .writeText(trim(sectionNode.stdErr), XmlFormatting::Newline);
        }
    }

    for (auto const &child : sectionNode.childSections) {
        if (hasClass)
            writeSection(className, qualifiedName, *child, testOkToFail);
        else
            writeSection(qualifiedName, "", *child, testOkToFail);
    }
}

// Writes every assertion recorded for the section, in stored order.
void JunitReporter::writeAssertions(SectionNode const &sectionNode) {
    for (auto const &assertion : sectionNode.assertions)
        writeAssertion(assertion);
}

// Writes a failed assertion as an <error>, <failure> or <internalError>
// element; assertions whose result is OK produce no output.
//
// The element carries the expression as "message", the macro name as "type"
// and a text body with the failure details, any info messages and the
// source location.
void JunitReporter::writeAssertion(AssertionStats const &stats) {
    AssertionResult const &result = stats.assertionResult;
    if (result.isOk())
        return;

    std::string elementName;
    switch (result.getResultType()) {
    case ResultWas::ThrewException:
    case ResultWas::FatalErrorCondition:
        elementName = "error";
        break;
    case ResultWas::ExplicitFailure:
    case ResultWas::ExpressionFailed:
    case ResultWas::DidntThrowException:
        elementName = "failure";
        break;

    // We should never see these here:
    case ResultWas::Info:
    case ResultWas::Warning:
    case ResultWas::Ok:
    case ResultWas::Unknown:
    case ResultWas::FailureBit:
    case ResultWas::Exception:
        elementName = "internalError";
        break;
    }

    XmlWriter::ScopedElement failureElement = xml.scopedElement(elementName);

    xml.writeAttribute("message", result.getExpression());
    xml.writeAttribute("type", result.getTestMacroName());

    ReusableStringStream details;
    if (stats.totals.assertions.total() > 0) {
        details << "FAILED"
                << ":\n";
        if (result.hasExpression()) {
            details << "  ";
            details << result.getExpressionInMacro();
            details << '\n';
        }
        if (result.hasExpandedExpression()) {
            details << "with expansion:\n";
            details << Column(result.getExpandedExpression()).indent(2) << '\n';
        }
    } else {
        details << '\n';
    }

    if (!result.getMessage().empty()) {
        details << result.getMessage() << '\n';
    }
    for (auto const &info : stats.infoMessages) {
        if (info.type == ResultWas::Info)
            details << info.message << '\n';
    }

    details << "at " << result.getSourceInfo();
    xml.writeText(details.str(), XmlFormatting::Newline);
}

CATCH_REGISTER_REPORTER("junit", JunitReporter)

}  // end namespace Catch
// end catch_reporter_junit.cpp
// start catch_reporter_listening.cpp

#include <cassert>

namespace Catch {

// Constructs the reporter with the shouldReportAllAssertions preference
// switched on.
ListeningReporter::ListeningReporter() {
    // We will assume that listeners will always want all assertions
    m_preferences.shouldReportAllAssertions = true;
}

// Takes ownership of `listener` and appends it to the list of listeners.
void ListeningReporter::addListener(IStreamingReporterPtr &&listener) {
    m_listeners.push_back(std::move(listener));
}

// Takes ownership of the single wrapped reporter and adopts its
// shouldRedirectStdOut preference. Asserts that no reporter was set before.
void ListeningReporter::addReporter(IStreamingReporterPtr &&reporter) {
    assert(!m_reporter && "Listening reporter can wrap only 1 real reporter");
    m_reporter = std::move(reporter);
    m_preferences.shouldRedirectStdOut = m_reporter->getPreferences().shouldRedirectStdOut;
}

// Returns a copy of the stored preferences.
ReporterPreferences ListeningReporter::getPreferences() const { return m_preferences; }

// Returns an empty set of verbosities.
std::set<Verbosity> ListeningReporter::getSupportedVerbosities() { return std::set<Verbosity>{}; }

void ListeningReporter::noMatchingTestCases(std::string const &spec) {
    for (auto const &listener : m_listeners) {
        listener->noMatchingTestCases(spec);
    }
    m_reporter->noMatchingTestCases(spec);
}

void ListeningReporter::reportInvalidArguments(std::string const &arg) {
    for (auto const &listener : m_listeners) {
        listener->reportInvalidArguments(arg);
    }
    m_reporter->reportInvalidArguments(arg);
}

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
void ListeningReporter::benchmarkPreparing(std::string const &name) {
    for (auto const &listener : m_listeners) {
        listener->benchmarkPreparing(name);
    }
    m_reporter->benchmarkPreparing(name);
}
// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::benchmarkStarting(BenchmarkInfo const &benchmarkInfo) {
    for (auto const &observer : m_listeners)
        observer->benchmarkStarting(benchmarkInfo);

    m_reporter->benchmarkStarting(benchmarkInfo);
}
// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::benchmarkEnded(BenchmarkStats<> const &benchmarkStats) {
    for (auto const &observer : m_listeners)
        observer->benchmarkEnded(benchmarkStats);

    m_reporter->benchmarkEnded(benchmarkStats);
}

void ListeningReporter::benchmarkFailed(std::string const &error) {
    for (auto const &listener : m_listeners) {
        listener->benchmarkFailed(error);
    }
    m_reporter->benchmarkFailed(error);
}
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::testRunStarting(TestRunInfo const &testRunInfo) {
    for (auto const &observer : m_listeners)
        observer->testRunStarting(testRunInfo);

    m_reporter->testRunStarting(testRunInfo);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::testGroupStarting(GroupInfo const &groupInfo) {
    for (auto const &observer : m_listeners)
        observer->testGroupStarting(groupInfo);

    m_reporter->testGroupStarting(groupInfo);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::testCaseStarting(TestCaseInfo const &testInfo) {
    for (auto const &observer : m_listeners)
        observer->testCaseStarting(testInfo);

    m_reporter->testCaseStarting(testInfo);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::sectionStarting(SectionInfo const &sectionInfo) {
    for (auto const &observer : m_listeners)
        observer->sectionStarting(sectionInfo);

    m_reporter->sectionStarting(sectionInfo);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::assertionStarting(AssertionInfo const &assertionInfo) {
    for (auto const &observer : m_listeners)
        observer->assertionStarting(assertionInfo);

    m_reporter->assertionStarting(assertionInfo);
}

// Forwards the event to every listener and then to the wrapped reporter.
// The return value indicates if the messages buffer should be cleared; only
// the wrapped reporter's answer is used, the listeners' answers are
// discarded.
bool ListeningReporter::assertionEnded(AssertionStats const &assertionStats) {
    for (auto const &observer : m_listeners)
        static_cast<void>(observer->assertionEnded(assertionStats));

    bool const clearMessages = m_reporter->assertionEnded(assertionStats);
    return clearMessages;
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::sectionEnded(SectionStats const &sectionStats) {
    for (auto const &observer : m_listeners)
        observer->sectionEnded(sectionStats);

    m_reporter->sectionEnded(sectionStats);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::testCaseEnded(TestCaseStats const &testCaseStats) {
    for (auto const &observer : m_listeners)
        observer->testCaseEnded(testCaseStats);

    m_reporter->testCaseEnded(testCaseStats);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::testGroupEnded(TestGroupStats const &testGroupStats) {
    for (auto const &observer : m_listeners)
        observer->testGroupEnded(testGroupStats);

    m_reporter->testGroupEnded(testGroupStats);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::testRunEnded(TestRunStats const &testRunStats) {
    for (auto const &observer : m_listeners)
        observer->testRunEnded(testRunStats);

    m_reporter->testRunEnded(testRunStats);
}

// Forwards the event to every listener, in registration order, and then to
// the wrapped reporter.
void ListeningReporter::skipTest(TestCaseInfo const &testInfo) {
    for (auto const &observer : m_listeners)
        observer->skipTest(testInfo);

    m_reporter->skipTest(testInfo);
}

// Always returns true for this reporter.
bool ListeningReporter::isMulti() const { return true; }

}  // end namespace Catch
// end catch_reporter_listening.cpp
// start catch_reporter_xml.cpp

#if defined(_MSC_VER)
#pragma warning(push)
#pragma warning(disable : 4061)  // Not all labels are EXPLICITLY handled in  \
                                 // switch Note that 4062 (not all labels are \
                                 // handled and default is missing) is enabled
#endif

namespace Catch {
// Constructs the reporter on top of StreamingReporterBase, with the XML
// writer bound to the configured stream, and switches on the
// shouldRedirectStdOut and shouldReportAllAssertions preferences.
XmlReporter::XmlReporter(ReporterConfig const &_config)
        : StreamingReporterBase(_config), m_xml(_config.stream()) {
    m_reporterPrefs.shouldRedirectStdOut = true;
    m_reporterPrefs.shouldReportAllAssertions = true;
}

// Defaulted destructor, defined out of line.
XmlReporter::~XmlReporter() = default;

// Returns the fixed one-line description of this reporter.
std::string XmlReporter::getDescription() { return "Reports test results as an XML document"; }

// Returns the stylesheet reference to emit; this implementation returns an
// empty string, in which case testRunStarting() writes no reference.
std::string XmlReporter::getStylesheetRef() const { return std::string(); }

// Writes the source location as "filename" and "line" attributes through
// the XML writer.
void XmlReporter::writeSourceInfo(SourceLineInfo const &sourceInfo) {
    m_xml.writeAttribute("filename", sourceInfo.file).writeAttribute("line", sourceInfo.line);
}

// Delegates to the base class implementation.
void XmlReporter::noMatchingTestCases(std::string const &s) {
    StreamingReporterBase::noMatchingTestCases(s);
}

// Starts the XML document: forwards the event to the base class, writes the
// stylesheet reference (if any) and opens the root <Catch> element with the
// optional "name" and "filters" attributes, followed by a <Randomness>
// element when the RNG seed is non-zero.
void XmlReporter::testRunStarting(TestRunInfo const &testInfo) {
    StreamingReporterBase::testRunStarting(testInfo);

    std::string const stylesheet = getStylesheetRef();
    if (!stylesheet.empty()) {
        m_xml.writeStylesheetRef(stylesheet);
    }

    m_xml.startElement("Catch");

    if (!m_config->name().empty()) {
        m_xml.writeAttribute("name", m_config->name());
    }
    if (m_config->testSpec().hasFilters()) {
        m_xml.writeAttribute("filters", serializeFilters(m_config->getTestsOrTags()));
    }
    if (m_config->rngSeed() != 0) {
        m_xml.scopedElement("Randomness").writeAttribute("seed", m_config->rngSeed());
    }
}

// Forwards the event to the base class and opens a <Group> element carrying
// the group name. The element is closed in testGroupEnded().
void XmlReporter::testGroupStarting(GroupInfo const &groupInfo) {
    StreamingReporterBase::testGroupStarting(groupInfo);
    m_xml.startElement("Group").writeAttribute("name", groupInfo.name);
}

// Forwards the event to the base class and opens a <TestCase> element with
// the trimmed name, description, tags and source location as attributes.
// The test case timer is only started when durations are always shown.
void XmlReporter::testCaseStarting(TestCaseInfo const &testInfo) {
    StreamingReporterBase::testCaseStarting(testInfo);
    m_xml.startElement("TestCase")
            .writeAttribute("name", trim(testInfo.name))
            .writeAttribute("description", testInfo.description)
            .writeAttribute("tags", testInfo.tagsAsString());

    writeSourceInfo(testInfo.lineInfo);

    if (m_config->showDurations() == ShowDurations::Always)
        m_testCaseTimer.start();
    // NOTE(review): presumably finishes the opening tag so that no further
    // attributes can be added to <TestCase> - confirm against XmlWriter.
    m_xml.ensureTagClosed();
}

// Forwards the event to the base class and increments the section depth.
// A <Section> element (name and source location) is only opened when the
// depth was already above zero before the increment, i.e. not for the
// outermost section.
void XmlReporter::sectionStarting(SectionInfo const &sectionInfo) {
    StreamingReporterBase::sectionStarting(sectionInfo);

    bool const isNested = m_sectionDepth > 0;
    ++m_sectionDepth;
    if (!isNested)
        return;

    m_xml.startElement("Section").writeAttribute("name", trim(sectionInfo.name));
    writeSourceInfo(sectionInfo.lineInfo);
    m_xml.ensureTagClosed();
}

// Intentionally empty: nothing is written when an assertion starts.
void XmlReporter::assertionStarting(AssertionInfo const &) {}

// Writes the outcome of a finished assertion as XML. Always returns true.
//
// Nothing is written for a successful result unless successful results are
// requested or the result is a warning. Otherwise the attached messages are
// written (<Warning> always, <Info> only when results are included),
// followed by an <Expression> element if there is an expression and a
// result-type specific element (<Exception>, <FatalErrorCondition>, <Info>
// or <Failure>).
bool XmlReporter::assertionEnded(AssertionStats const &assertionStats) {
    AssertionResult const &result = assertionStats.assertionResult;

    bool const includeResults = m_config->includeSuccessfulResults() || !result.isOk();

    // Drop out if result was successful but we're not printing them.
    if (!includeResults && result.getResultType() != ResultWas::Warning)
        return true;

    // Print any info messages in <Info> tags and warnings in <Warning> tags.
    for (auto const &message : assertionStats.infoMessages) {
        if (message.type == ResultWas::Warning) {
            m_xml.scopedElement("Warning").writeText(message.message);
        } else if (message.type == ResultWas::Info && includeResults) {
            m_xml.scopedElement("Info").writeText(message.message);
        }
    }

    // Print the expression if there is one.
    bool const hasExpression = result.hasExpression();
    if (hasExpression) {
        m_xml.startElement("Expression")
                .writeAttribute("success", result.succeeded())
                .writeAttribute("type", result.getTestMacroName());

        writeSourceInfo(result.getSourceInfo());

        m_xml.scopedElement("Original").writeText(result.getExpression());
        m_xml.scopedElement("Expanded").writeText(result.getExpandedExpression());
    }

    // Writes <elementName filename=... line=...>message</elementName>.
    auto writeLocatedMessage = [&](char const *elementName) {
        m_xml.startElement(elementName);
        writeSourceInfo(result.getSourceInfo());
        m_xml.writeText(result.getMessage());
        m_xml.endElement();
    };

    // And... Print a result applicable to each result type.
    switch (result.getResultType()) {
    case ResultWas::ThrewException:
        writeLocatedMessage("Exception");
        break;
    case ResultWas::FatalErrorCondition:
        writeLocatedMessage("FatalErrorCondition");
        break;
    case ResultWas::ExplicitFailure:
        writeLocatedMessage("Failure");
        break;
    case ResultWas::Info:
        m_xml.scopedElement("Info").writeText(result.getMessage());
        break;
    case ResultWas::Warning:
        // Warning will already have been written
        break;
    default:
        break;
    }

    // Close the <Expression> element opened above.
    if (hasExpression)
        m_xml.endElement();

    return true;
}

// Forwards the event to the base class and decrements the section depth.
// For nested sections (depth still above zero after the decrement) an
// <OverallResults> element with the section's assertion counts is written,
// plus the duration when durations are always shown.
void XmlReporter::sectionEnded(SectionStats const &sectionStats) {
    StreamingReporterBase::sectionEnded(sectionStats);
    if (--m_sectionDepth > 0) {
        XmlWriter::ScopedElement e = m_xml.scopedElement("OverallResults");
        e.writeAttribute("successes", sectionStats.assertions.passed);
        e.writeAttribute("failures", sectionStats.assertions.failed);
        e.writeAttribute("expectedFailures", sectionStats.assertions.failedButOk);

        if (m_config->showDurations() == ShowDurations::Always)
            e.writeAttribute("durationInSeconds", sectionStats.durationInSeconds);

        // NOTE(review): explicit endElement() in addition to the scoped
        // element `e` going out of scope - presumably one closes
        // <OverallResults> and the other the <Section> opened in
        // sectionStarting(); confirm against XmlWriter.
        m_xml.endElement();
    }
}

// Writes the per-test-case summary: an "OverallResult" element carrying the
// success flag (and optionally the elapsed time), followed by any captured
// standard output / standard error text.
void XmlReporter::testCaseEnded(TestCaseStats const &testCaseStats) {
    StreamingReporterBase::testCaseEnded(testCaseStats);

    XmlWriter::ScopedElement outcome = m_xml.scopedElement("OverallResult");
    outcome.writeAttribute("success", testCaseStats.totals.assertions.allOk());

    bool const reportDuration = m_config->showDurations() == ShowDurations::Always;
    if (reportDuration)
        outcome.writeAttribute("durationInSeconds", m_testCaseTimer.getElapsedSeconds());

    // NOTE(review): `outcome` is still alive here, so StdOut/StdErr appear to
    // be emitted as children of OverallResult -- confirm against XmlWriter.
    auto const &capturedOut = testCaseStats.stdOut;
    if (!capturedOut.empty()) {
        m_xml.scopedElement("StdOut").writeText(trim(capturedOut), XmlFormatting::Newline);
    }

    auto const &capturedErr = testCaseStats.stdErr;
    if (!capturedErr.empty()) {
        m_xml.scopedElement("StdErr").writeText(trim(capturedErr), XmlFormatting::Newline);
    }

    m_xml.endElement();
}

// Writes the totals for a finished test group: one element with assertion
// counts, one with test-case counts, then one explicit endElement() call.
void XmlReporter::testGroupEnded(TestGroupStats const &testGroupStats) {
    StreamingReporterBase::testGroupEnded(testGroupStats);
    // TODO: Check testGroupStats.aborting and act accordingly.

    auto const &assertionCounts = testGroupStats.totals.assertions;
    auto const &caseCounts = testGroupStats.totals.testCases;

    {
        // Scoped so the element is finished before the next one starts.
        XmlWriter::ScopedElement assertionTotals = m_xml.scopedElement("OverallResults");
        assertionTotals.writeAttribute("successes", assertionCounts.passed);
        assertionTotals.writeAttribute("failures", assertionCounts.failed);
        assertionTotals.writeAttribute("expectedFailures", assertionCounts.failedButOk);
    }
    {
        XmlWriter::ScopedElement caseTotals = m_xml.scopedElement("OverallResultsCases");
        caseTotals.writeAttribute("successes", caseCounts.passed);
        caseTotals.writeAttribute("failures", caseCounts.failed);
        caseTotals.writeAttribute("expectedFailures", caseCounts.failedButOk);
    }

    m_xml.endElement();
}

// Writes the totals for the whole run: assertion counts, then test-case
// counts, then one explicit endElement() call.
void XmlReporter::testRunEnded(TestRunStats const &testRunStats) {
    StreamingReporterBase::testRunEnded(testRunStats);

    auto const &assertionCounts = testRunStats.totals.assertions;
    auto const &caseCounts = testRunStats.totals.testCases;

    {
        // Scoped so the element is finished before the next one starts.
        XmlWriter::ScopedElement assertionTotals = m_xml.scopedElement("OverallResults");
        assertionTotals.writeAttribute("successes", assertionCounts.passed);
        assertionTotals.writeAttribute("failures", assertionCounts.failed);
        assertionTotals.writeAttribute("expectedFailures", assertionCounts.failedButOk);
    }
    {
        XmlWriter::ScopedElement caseTotals = m_xml.scopedElement("OverallResultsCases");
        caseTotals.writeAttribute("successes", caseCounts.passed);
        caseTotals.writeAttribute("failures", caseCounts.failed);
        caseTotals.writeAttribute("expectedFailures", caseCounts.failedButOk);
    }

    m_xml.endElement();
}

#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// Opens the "BenchmarkResults" element and tags it with the benchmark name.
// The element is left open; it is closed by benchmarkEnded / benchmarkFailed.
void XmlReporter::benchmarkPreparing(std::string const &name) {
    m_xml.startElement("BenchmarkResults");
    m_xml.writeAttribute("name", name);
}

// Adds the sampling parameters of the benchmark as attributes on the element
// that is currently open, followed by a comment stating the time unit.
void XmlReporter::benchmarkStarting(BenchmarkInfo const &info) {
    m_xml.writeAttribute("samples", info.samples);
    m_xml.writeAttribute("resamples", info.resamples);
    m_xml.writeAttribute("iterations", info.iterations);
    m_xml.writeAttribute("clockResolution", info.clockResolution);
    m_xml.writeAttribute("estimatedDuration", info.estimatedDuration);
    m_xml.writeComment("All values in nano seconds");
}

// Emits the benchmark statistics as three child elements ("mean",
// "standardDeviation", "outliers") and then issues one further endElement()
// for the element that was open on entry.
void XmlReporter::benchmarkEnded(BenchmarkStats<> const &benchmarkStats) {
    auto const &mean = benchmarkStats.mean;
    m_xml.startElement("mean");
    m_xml.writeAttribute("value", mean.point.count());
    m_xml.writeAttribute("lowerBound", mean.lower_bound.count());
    m_xml.writeAttribute("upperBound", mean.upper_bound.count());
    m_xml.writeAttribute("ci", mean.confidence_interval);
    m_xml.endElement();

    auto const &deviation = benchmarkStats.standardDeviation;
    m_xml.startElement("standardDeviation");
    m_xml.writeAttribute("value", deviation.point.count());
    m_xml.writeAttribute("lowerBound", deviation.lower_bound.count());
    m_xml.writeAttribute("upperBound", deviation.upper_bound.count());
    m_xml.writeAttribute("ci", deviation.confidence_interval);
    m_xml.endElement();

    auto const &outliers = benchmarkStats.outliers;
    m_xml.startElement("outliers");
    m_xml.writeAttribute("variance", benchmarkStats.outlierVariance);
    m_xml.writeAttribute("lowMild", outliers.low_mild);
    m_xml.writeAttribute("lowSevere", outliers.low_severe);
    m_xml.writeAttribute("highMild", outliers.high_mild);
    m_xml.writeAttribute("highSevere", outliers.high_severe);
    m_xml.endElement();

    // Closes the enclosing element (the one opened by benchmarkPreparing).
    m_xml.endElement();
}

void XmlReporter::benchmarkFailed(std::string const &error) {
    m_xml.scopedElement("failed").writeAttribute("message", error);
    m_xml.endElement();
}
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// Registers XmlReporter under the reporter name "xml".
CATCH_REGISTER_REPORTER("xml", XmlReporter)

}  // end namespace Catch

#if defined(_MSC_VER)
#pragma warning(pop)
#endif
// end catch_reporter_xml.cpp

namespace Catch {
// Single namespace-scope LeakDetector instance for the implementation
// translation unit; it is constructed during static initialization.
// NOTE(review): what its constructor/destructor do is defined elsewhere.
LeakDetector leakDetector;
}

#ifdef __clang__
#pragma clang diagnostic pop
#endif

// end catch_impl.hpp
#endif

#ifdef CATCH_CONFIG_MAIN
// start catch_default_main.hpp

// Default program entry points, compiled only when CATCH_CONFIG_MAIN is
// defined. Each variant hands the command line to a Catch::Session and uses
// the session's result as the process exit code.

#ifndef __OBJC__

#if defined(CATCH_CONFIG_WCHAR) && defined(CATCH_PLATFORM_WINDOWS) && defined(_UNICODE) && \
        !defined(DO_NOT_USE_WMAIN)
// Standard C/C++ Win32 Unicode wmain entry point
extern "C" int wmain(int argc, wchar_t *argv[], wchar_t *[]) {
#else
// Standard C/C++ main entry point
int main(int argc, char *argv[]) {
#endif

    // Shared body for both the wmain and the main header above.
    int const exitCode = Catch::Session().run(argc, argv);
    return exitCode;
}

#else  // __OBJC__

// Objective-C entry point
int main(int argc, char *const argv[]) {
    // Without ARC an autorelease pool must be managed by hand around the run.
#if !CATCH_ARC_ENABLED
    NSAutoreleasePool *pool = [[NSAutoreleasePool alloc] init];
#endif

    Catch::registerTestMethods();
    int exitCode = Catch::Session().run(argc, (char **)argv);

#if !CATCH_ARC_ENABLED
    [pool drain];
#endif

    return exitCode;
}

#endif  // __OBJC__

// end catch_default_main.hpp
#endif

#if !defined(CATCH_CONFIG_IMPL_ONLY)

#ifdef CLARA_CONFIG_MAIN_NOT_DEFINED
#undef CLARA_CONFIG_MAIN
#endif

#if !defined(CATCH_CONFIG_DISABLE)
//////
// If this config identifier is defined then all CATCH macros are prefixed with
// CATCH_
#ifdef CATCH_CONFIG_PREFIX_ALL

// CATCH_-prefixed assertion macros. Each forwards to an INTERNAL_CATCH_*
// macro, passing its own name as a string plus a ResultDisposition.
//
// CATCH_REQUIRE* family: uses ResultDisposition::Normal.
#define CATCH_REQUIRE(...) \
    INTERNAL_CATCH_TEST("CATCH_REQUIRE", Catch::ResultDisposition::Normal, __VA_ARGS__)
// FalseTest is OR-ed into the disposition for the negated form.
#define CATCH_REQUIRE_FALSE(...)                                                                \
    INTERNAL_CATCH_TEST("CATCH_REQUIRE_FALSE",                                                  \
                        Catch::ResultDisposition::Normal | Catch::ResultDisposition::FalseTest, \
                        __VA_ARGS__)

// Exception-expecting forms of CATCH_REQUIRE.
#define CATCH_REQUIRE_THROWS(...) \
    INTERNAL_CATCH_THROWS("CATCH_REQUIRE_THROWS", Catch::ResultDisposition::Normal, __VA_ARGS__)
#define CATCH_REQUIRE_THROWS_AS(expr, exceptionType)                   \
    INTERNAL_CATCH_THROWS_AS("CATCH_REQUIRE_THROWS_AS", exceptionType, \
                             Catch::ResultDisposition::Normal, expr)
#define CATCH_REQUIRE_THROWS_WITH(expr, matcher)                   \
    INTERNAL_CATCH_THROWS_STR_MATCHES("CATCH_REQUIRE_THROWS_WITH", \
                                      Catch::ResultDisposition::Normal, matcher, expr)
// Matcher-based form; omitted when CATCH_CONFIG_DISABLE_MATCHERS is defined.
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CATCH_REQUIRE_THROWS_MATCHES(expr, exceptionType, matcher)               \
    INTERNAL_CATCH_THROWS_MATCHES("CATCH_REQUIRE_THROWS_MATCHES", exceptionType, \
                                  Catch::ResultDisposition::Normal, matcher, expr)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define CATCH_REQUIRE_NOTHROW(...) \
    INTERNAL_CATCH_NO_THROW("CATCH_REQUIRE_NOTHROW", Catch::ResultDisposition::Normal, __VA_ARGS__)

// CATCH_CHECK* family: same shape as CATCH_REQUIRE* but with
// ResultDisposition::ContinueOnFailure.
#define CATCH_CHECK(...) \
    INTERNAL_CATCH_TEST("CATCH_CHECK", Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
#define CATCH_CHECK_FALSE(...)                                                                 \
    INTERNAL_CATCH_TEST(                                                                       \
            "CATCH_CHECK_FALSE",                                                               \
            Catch::ResultDisposition::ContinueOnFailure | Catch::ResultDisposition::FalseTest, \
            __VA_ARGS__)
// Conditional forms, routed through INTERNAL_CATCH_IF / INTERNAL_CATCH_ELSE.
#define CATCH_CHECKED_IF(...) \
    INTERNAL_CATCH_IF("CATCH_CHECKED_IF", Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
#define CATCH_CHECKED_ELSE(...)                                                            \
    INTERNAL_CATCH_ELSE("CATCH_CHECKED_ELSE", Catch::ResultDisposition::ContinueOnFailure, \
                        __VA_ARGS__)
// SuppressFail is OR-ed into the disposition for the no-fail form.
#define CATCH_CHECK_NOFAIL(...)                                                                   \
    INTERNAL_CATCH_TEST(                                                                          \
            "CATCH_CHECK_NOFAIL",                                                                 \
            Catch::ResultDisposition::ContinueOnFailure | Catch::ResultDisposition::SuppressFail, \
            __VA_ARGS__)

// Exception-expecting forms of CATCH_CHECK.
#define CATCH_CHECK_THROWS(...)                                                              \
    INTERNAL_CATCH_THROWS("CATCH_CHECK_THROWS", Catch::ResultDisposition::ContinueOnFailure, \
                          __VA_ARGS__)
#define CATCH_CHECK_THROWS_AS(expr, exceptionType)                   \
    INTERNAL_CATCH_THROWS_AS("CATCH_CHECK_THROWS_AS", exceptionType, \
                             Catch::ResultDisposition::ContinueOnFailure, expr)
#define CATCH_CHECK_THROWS_WITH(expr, matcher)                   \
    INTERNAL_CATCH_THROWS_STR_MATCHES("CATCH_CHECK_THROWS_WITH", \
                                      Catch::ResultDisposition::ContinueOnFailure, matcher, expr)
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CATCH_CHECK_THROWS_MATCHES(expr, exceptionType, matcher)               \
    INTERNAL_CATCH_THROWS_MATCHES("CATCH_CHECK_THROWS_MATCHES", exceptionType, \
                                  Catch::ResultDisposition::ContinueOnFailure, matcher, expr)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define CATCH_CHECK_NOTHROW(...)                                                                \
    INTERNAL_CATCH_NO_THROW("CATCH_CHECK_NOTHROW", Catch::ResultDisposition::ContinueOnFailure, \
                            __VA_ARGS__)

// Matcher assertions; both are omitted when CATCH_CONFIG_DISABLE_MATCHERS is
// defined.
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CATCH_CHECK_THAT(arg, matcher)                                                            \
    INTERNAL_CHECK_THAT("CATCH_CHECK_THAT", matcher, Catch::ResultDisposition::ContinueOnFailure, \
                        arg)

#define CATCH_REQUIRE_THAT(arg, matcher) \
    INTERNAL_CHECK_THAT("CATCH_REQUIRE_THAT", matcher, Catch::ResultDisposition::Normal, arg)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS

// CATCH_-prefixed message macros.
#define CATCH_INFO(msg) INTERNAL_CATCH_INFO("CATCH_INFO", msg)
#define CATCH_UNSCOPED_INFO(msg) INTERNAL_CATCH_UNSCOPED_INFO("CATCH_UNSCOPED_INFO", msg)
#define CATCH_WARN(msg)                                         \
    INTERNAL_CATCH_MSG("CATCH_WARN", Catch::ResultWas::Warning, \
                       Catch::ResultDisposition::ContinueOnFailure, msg)
// Variadic: any number of expressions may be captured in one call.
#define CATCH_CAPTURE(...) \
    INTERNAL_CATCH_CAPTURE(INTERNAL_CATCH_UNIQUE_NAME(capturer), "CATCH_CAPTURE", __VA_ARGS__)

// CATCH_-prefixed test-case and section registration macros.
#define CATCH_TEST_CASE(...) INTERNAL_CATCH_TESTCASE(__VA_ARGS__)
#define CATCH_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEST_CASE_METHOD(className, __VA_ARGS__)
#define CATCH_METHOD_AS_TEST_CASE(method, ...) \
    INTERNAL_CATCH_METHOD_AS_TEST_CASE(method, __VA_ARGS__)
#define CATCH_REGISTER_TEST_CASE(Function, ...) \
    INTERNAL_CATCH_REGISTER_TESTCASE(Function, __VA_ARGS__)
#define CATCH_SECTION(...) INTERNAL_CATCH_SECTION(__VA_ARGS__)
#define CATCH_DYNAMIC_SECTION(...) INTERNAL_CATCH_DYNAMIC_SECTION(__VA_ARGS__)
// Explicit outcome macros: ExplicitFailure with Normal disposition,
// ExplicitFailure with ContinueOnFailure, and Ok respectively.
#define CATCH_FAIL(...)                                                 \
    INTERNAL_CATCH_MSG("CATCH_FAIL", Catch::ResultWas::ExplicitFailure, \
                       Catch::ResultDisposition::Normal, __VA_ARGS__)
#define CATCH_FAIL_CHECK(...)                                                 \
    INTERNAL_CATCH_MSG("CATCH_FAIL_CHECK", Catch::ResultWas::ExplicitFailure, \
                       Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
#define CATCH_SUCCEED(...)                                    \
    INTERNAL_CATCH_MSG("CATCH_SUCCEED", Catch::ResultWas::Ok, \
                       Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)

// Test case registered with no name or tags supplied.
#define CATCH_ANON_TEST_CASE() INTERNAL_CATCH_TESTCASE()

// CATCH_-prefixed template test-case macros.
//
// Two parallel tables: the first forwards directly to the INTERNAL_CATCH_*
// macro; the second (used when CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR is
// defined) additionally wraps the call in INTERNAL_CATCH_EXPAND_VARGS.
//
// The CATCH_TEMPLATE_LIST_TEST_CASE / CATCH_TEMPLATE_LIST_TEST_CASE_METHOD
// entries mirror the unprefixed TEMPLATE_LIST_TEST_CASE macros so that
// list-based template tests are also available under CATCH_CONFIG_PREFIX_ALL.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define CATCH_TEMPLATE_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__)
#define CATCH_TEMPLATE_TEST_CASE_SIG(...) INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG(__VA_ARGS__)
#define CATCH_TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#define CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, __VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE(__VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(__VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, __VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, __VA_ARGS__)
#define CATCH_TEMPLATE_LIST_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE(__VA_ARGS__)
#define CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(className, __VA_ARGS__)
#else
#define CATCH_TEMPLATE_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__))
#define CATCH_TEMPLATE_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG(__VA_ARGS__))
#define CATCH_TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__))
#define CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                            \
            INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, __VA_ARGS__))
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE(__VA_ARGS__))
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(__VA_ARGS__))
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                                \
            INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, __VA_ARGS__))
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                                    \
            INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, __VA_ARGS__))
#define CATCH_TEMPLATE_LIST_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE(__VA_ARGS__))
#define CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                             \
            INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(className, __VA_ARGS__))
#endif

// CATCH_-prefixed static assertions.
//
// By default each macro expands to a static_assert followed by a
// CATCH_SUCCEED carrying the stringified expression. When
// CATCH_CONFIG_RUNTIME_STATIC_REQUIRE is defined they become ordinary
// CATCH_REQUIRE / CATCH_REQUIRE_FALSE checks instead.
//
// Note: the default expansion is two statements, so wrap the macro in braces
// when it is the sole body of an if/else/loop.
#if !defined(CATCH_CONFIG_RUNTIME_STATIC_REQUIRE)
#define CATCH_STATIC_REQUIRE(...)             \
    static_assert(__VA_ARGS__, #__VA_ARGS__); \
    CATCH_SUCCEED(#__VA_ARGS__)
// The success message carries the negated text "!(expr)", matching both the
// static_assert message here and the unprefixed STATIC_REQUIRE_FALSE.
#define CATCH_STATIC_REQUIRE_FALSE(...)                   \
    static_assert(!(__VA_ARGS__), "!(" #__VA_ARGS__ ")"); \
    CATCH_SUCCEED("!(" #__VA_ARGS__ ")")
#else
#define CATCH_STATIC_REQUIRE(...) CATCH_REQUIRE(__VA_ARGS__)
#define CATCH_STATIC_REQUIRE_FALSE(...) CATCH_REQUIRE_FALSE(__VA_ARGS__)
#endif

// "BDD-style" convenience wrappers
// CATCH_SCENARIO* prepend "Scenario: " to the test name by string-literal
// concatenation, so the first argument must be a string literal.
#define CATCH_SCENARIO(...) CATCH_TEST_CASE("Scenario: " __VA_ARGS__)
#define CATCH_SCENARIO_METHOD(className, ...) \
    INTERNAL_CATCH_TEST_CASE_METHOD(className, "Scenario: " __VA_ARGS__)
// Each step is a dynamic section whose name is a fixed label streamed
// together with desc; the labels are space-padded to a common width.
#define CATCH_GIVEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("    Given: " << desc)
#define CATCH_AND_GIVEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("And given: " << desc)
#define CATCH_WHEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("     When: " << desc)
#define CATCH_AND_WHEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION(" And when: " << desc)
#define CATCH_THEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("     Then: " << desc)
#define CATCH_AND_THEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("      And: " << desc)

// Benchmark macros; only available when CATCH_CONFIG_ENABLE_BENCHMARKING is
// defined.
#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// Passes the first and second variadic arguments separately, via
// INTERNAL_CATCH_GET_1_ARG and INTERNAL_CATCH_GET_2_ARG.
#define CATCH_BENCHMARK(...)                                                             \
    INTERNAL_CATCH_BENCHMARK(INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____B_E_N_C_H____), \
                             INTERNAL_CATCH_GET_1_ARG(__VA_ARGS__, , ),                  \
                             INTERNAL_CATCH_GET_2_ARG(__VA_ARGS__, , ))
#define CATCH_BENCHMARK_ADVANCED(name)                                                            \
    INTERNAL_CATCH_BENCHMARK_ADVANCED(INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____B_E_N_C_H____), \
                                      name)
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// If CATCH_CONFIG_PREFIX_ALL is not defined then the CATCH_ prefix is not
// required
#else

// Unprefixed assertion macros. Each forwards to an INTERNAL_CATCH_* macro,
// passing its own name as a string plus a ResultDisposition.
//
// REQUIRE* family: uses ResultDisposition::Normal.
#define REQUIRE(...) INTERNAL_CATCH_TEST("REQUIRE", Catch::ResultDisposition::Normal, __VA_ARGS__)
// FalseTest is OR-ed into the disposition for the negated form.
#define REQUIRE_FALSE(...)                                                                      \
    INTERNAL_CATCH_TEST("REQUIRE_FALSE",                                                        \
                        Catch::ResultDisposition::Normal | Catch::ResultDisposition::FalseTest, \
                        __VA_ARGS__)

// Exception-expecting forms of REQUIRE.
#define REQUIRE_THROWS(...) \
    INTERNAL_CATCH_THROWS("REQUIRE_THROWS", Catch::ResultDisposition::Normal, __VA_ARGS__)
#define REQUIRE_THROWS_AS(expr, exceptionType)                                                     \
    INTERNAL_CATCH_THROWS_AS("REQUIRE_THROWS_AS", exceptionType, Catch::ResultDisposition::Normal, \
                             expr)
#define REQUIRE_THROWS_WITH(expr, matcher)                                                     \
    INTERNAL_CATCH_THROWS_STR_MATCHES("REQUIRE_THROWS_WITH", Catch::ResultDisposition::Normal, \
                                      matcher, expr)
// Matcher-based form; omitted when CATCH_CONFIG_DISABLE_MATCHERS is defined.
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define REQUIRE_THROWS_MATCHES(expr, exceptionType, matcher)               \
    INTERNAL_CATCH_THROWS_MATCHES("REQUIRE_THROWS_MATCHES", exceptionType, \
                                  Catch::ResultDisposition::Normal, matcher, expr)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define REQUIRE_NOTHROW(...) \
    INTERNAL_CATCH_NO_THROW("REQUIRE_NOTHROW", Catch::ResultDisposition::Normal, __VA_ARGS__)

// CHECK* family: same shape as REQUIRE* but with
// ResultDisposition::ContinueOnFailure.
#define CHECK(...) \
    INTERNAL_CATCH_TEST("CHECK", Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
#define CHECK_FALSE(...)                                                                       \
    INTERNAL_CATCH_TEST(                                                                       \
            "CHECK_FALSE",                                                                     \
            Catch::ResultDisposition::ContinueOnFailure | Catch::ResultDisposition::FalseTest, \
            __VA_ARGS__)
// Conditional forms, routed through INTERNAL_CATCH_IF / INTERNAL_CATCH_ELSE.
#define CHECKED_IF(...) \
    INTERNAL_CATCH_IF("CHECKED_IF", Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
#define CHECKED_ELSE(...) \
    INTERNAL_CATCH_ELSE("CHECKED_ELSE", Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
// SuppressFail is OR-ed into the disposition for the no-fail form.
#define CHECK_NOFAIL(...)                                                                         \
    INTERNAL_CATCH_TEST(                                                                          \
            "CHECK_NOFAIL",                                                                       \
            Catch::ResultDisposition::ContinueOnFailure | Catch::ResultDisposition::SuppressFail, \
            __VA_ARGS__)

// Exception-expecting forms of CHECK.
#define CHECK_THROWS(...) \
    INTERNAL_CATCH_THROWS("CHECK_THROWS", Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
#define CHECK_THROWS_AS(expr, exceptionType)                   \
    INTERNAL_CATCH_THROWS_AS("CHECK_THROWS_AS", exceptionType, \
                             Catch::ResultDisposition::ContinueOnFailure, expr)
#define CHECK_THROWS_WITH(expr, matcher)                   \
    INTERNAL_CATCH_THROWS_STR_MATCHES("CHECK_THROWS_WITH", \
                                      Catch::ResultDisposition::ContinueOnFailure, matcher, expr)
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CHECK_THROWS_MATCHES(expr, exceptionType, matcher)               \
    INTERNAL_CATCH_THROWS_MATCHES("CHECK_THROWS_MATCHES", exceptionType, \
                                  Catch::ResultDisposition::ContinueOnFailure, matcher, expr)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define CHECK_NOTHROW(...)                                                                \
    INTERNAL_CATCH_NO_THROW("CHECK_NOTHROW", Catch::ResultDisposition::ContinueOnFailure, \
                            __VA_ARGS__)

// Matcher assertions; both are omitted when CATCH_CONFIG_DISABLE_MATCHERS is
// defined.
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CHECK_THAT(arg, matcher) \
    INTERNAL_CHECK_THAT("CHECK_THAT", matcher, Catch::ResultDisposition::ContinueOnFailure, arg)

#define REQUIRE_THAT(arg, matcher) \
    INTERNAL_CHECK_THAT("REQUIRE_THAT", matcher, Catch::ResultDisposition::Normal, arg)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS

// Unprefixed message macros.
#define INFO(msg) INTERNAL_CATCH_INFO("INFO", msg)
#define UNSCOPED_INFO(msg) INTERNAL_CATCH_UNSCOPED_INFO("UNSCOPED_INFO", msg)
#define WARN(msg)                                         \
    INTERNAL_CATCH_MSG("WARN", Catch::ResultWas::Warning, \
                       Catch::ResultDisposition::ContinueOnFailure, msg)
// Variadic: any number of expressions may be captured in one call.
#define CAPTURE(...) \
    INTERNAL_CATCH_CAPTURE(INTERNAL_CATCH_UNIQUE_NAME(capturer), "CAPTURE", __VA_ARGS__)

// Unprefixed test-case and section registration macros.
#define TEST_CASE(...) INTERNAL_CATCH_TESTCASE(__VA_ARGS__)
#define TEST_CASE_METHOD(className, ...) INTERNAL_CATCH_TEST_CASE_METHOD(className, __VA_ARGS__)
#define METHOD_AS_TEST_CASE(method, ...) INTERNAL_CATCH_METHOD_AS_TEST_CASE(method, __VA_ARGS__)
#define REGISTER_TEST_CASE(Function, ...) INTERNAL_CATCH_REGISTER_TESTCASE(Function, __VA_ARGS__)
#define SECTION(...) INTERNAL_CATCH_SECTION(__VA_ARGS__)
#define DYNAMIC_SECTION(...) INTERNAL_CATCH_DYNAMIC_SECTION(__VA_ARGS__)
// Explicit outcome macros: ExplicitFailure with Normal disposition,
// ExplicitFailure with ContinueOnFailure, and Ok respectively.
#define FAIL(...)                                                 \
    INTERNAL_CATCH_MSG("FAIL", Catch::ResultWas::ExplicitFailure, \
                       Catch::ResultDisposition::Normal, __VA_ARGS__)
#define FAIL_CHECK(...)                                                 \
    INTERNAL_CATCH_MSG("FAIL_CHECK", Catch::ResultWas::ExplicitFailure, \
                       Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
#define SUCCEED(...)                                    \
    INTERNAL_CATCH_MSG("SUCCEED", Catch::ResultWas::Ok, \
                       Catch::ResultDisposition::ContinueOnFailure, __VA_ARGS__)
// Test case registered with no name or tags supplied.
#define ANON_TEST_CASE() INTERNAL_CATCH_TESTCASE()

// Unprefixed template test-case macros.
//
// Two parallel tables: the first forwards directly to the INTERNAL_CATCH_*
// macro; the second (used when CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR is
// defined) additionally wraps the call in INTERNAL_CATCH_EXPAND_VARGS.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define TEMPLATE_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__)
#define TEMPLATE_TEST_CASE_SIG(...) INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG(__VA_ARGS__)
#define TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#define TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, __VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE(__VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(__VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, __VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, __VA_ARGS__)
#define TEMPLATE_LIST_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE(__VA_ARGS__)
#define TEMPLATE_LIST_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(className, __VA_ARGS__)
#else
// Same macros, each wrapped in INTERNAL_CATCH_EXPAND_VARGS.
#define TEMPLATE_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__))
#define TEMPLATE_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG(__VA_ARGS__))
#define TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__))
#define TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                      \
            INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, __VA_ARGS__))
#define TEMPLATE_PRODUCT_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE(__VA_ARGS__))
#define TEMPLATE_PRODUCT_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(__VA_ARGS__))
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                          \
            INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, __VA_ARGS__))
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                              \
            INTERNAL_CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, __VA_ARGS__))
#define TEMPLATE_LIST_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE(__VA_ARGS__))
#define TEMPLATE_LIST_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                       \
            INTERNAL_CATCH_TEMPLATE_LIST_TEST_CASE_METHOD(className, __VA_ARGS__))
#endif

// Static assertions.
//
// By default each macro expands to a static_assert followed by a SUCCEED
// carrying the same stringified text. When
// CATCH_CONFIG_RUNTIME_STATIC_REQUIRE is defined they become ordinary
// REQUIRE / REQUIRE_FALSE checks instead.
//
// Note: the default expansion is two statements, so wrap the macro in braces
// when it is the sole body of an if/else/loop.
#if !defined(CATCH_CONFIG_RUNTIME_STATIC_REQUIRE)
#define STATIC_REQUIRE(...)                   \
    static_assert(__VA_ARGS__, #__VA_ARGS__); \
    SUCCEED(#__VA_ARGS__)
#define STATIC_REQUIRE_FALSE(...)                         \
    static_assert(!(__VA_ARGS__), "!(" #__VA_ARGS__ ")"); \
    SUCCEED("!(" #__VA_ARGS__ ")")
#else
#define STATIC_REQUIRE(...) REQUIRE(__VA_ARGS__)
#define STATIC_REQUIRE_FALSE(...) REQUIRE_FALSE(__VA_ARGS__)
#endif

#endif

// The definitions from here to the Approx using-declaration sit outside the
// CATCH_CONFIG_PREFIX_ALL conditional, so they are defined in both prefix
// modes.
// NOTE(review): SCENARIO expands to TEST_CASE, which is only defined in the
// unprefixed branch -- confirm whether the unprefixed BDD wrappers are meant
// to be visible under CATCH_CONFIG_PREFIX_ALL.
#define CATCH_TRANSLATE_EXCEPTION(signature) INTERNAL_CATCH_TRANSLATE_EXCEPTION(signature)

// "BDD-style" convenience wrappers
// SCENARIO* prepend "Scenario: " to the test name by string-literal
// concatenation, so the first argument must be a string literal.
#define SCENARIO(...) TEST_CASE("Scenario: " __VA_ARGS__)
#define SCENARIO_METHOD(className, ...) \
    INTERNAL_CATCH_TEST_CASE_METHOD(className, "Scenario: " __VA_ARGS__)

// Each step is a dynamic section whose name is a fixed label streamed
// together with desc; the labels are space-padded to a common width.
#define GIVEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("    Given: " << desc)
#define AND_GIVEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("And given: " << desc)
#define WHEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("     When: " << desc)
#define AND_WHEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION(" And when: " << desc)
#define THEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("     Then: " << desc)
#define AND_THEN(desc) INTERNAL_CATCH_DYNAMIC_SECTION("      And: " << desc)

// Benchmark macros; only available when CATCH_CONFIG_ENABLE_BENCHMARKING is
// defined.
#if defined(CATCH_CONFIG_ENABLE_BENCHMARKING)
// Passes the first and second variadic arguments separately, via
// INTERNAL_CATCH_GET_1_ARG and INTERNAL_CATCH_GET_2_ARG.
#define BENCHMARK(...)                                                                   \
    INTERNAL_CATCH_BENCHMARK(INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____B_E_N_C_H____), \
                             INTERNAL_CATCH_GET_1_ARG(__VA_ARGS__, , ),                  \
                             INTERNAL_CATCH_GET_2_ARG(__VA_ARGS__, , ))
#define BENCHMARK_ADVANCED(name)                                                                  \
    INTERNAL_CATCH_BENCHMARK_ADVANCED(INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____B_E_N_C_H____), \
                                      name)
#endif  // CATCH_CONFIG_ENABLE_BENCHMARKING

// Brings Catch::Detail::Approx into the including scope under the short name
// Approx.
using Catch::Detail::Approx;

#else  // CATCH_CONFIG_DISABLE

//////
// If this config identifier is defined then all CATCH macros are prefixed with
// CATCH_
#ifdef CATCH_CONFIG_PREFIX_ALL

// CATCH_CONFIG_DISABLE variants of the CATCH_-prefixed assertion macros.
// Every assertion collapses to the no-op expression (void)(0); its arguments
// are discarded and never evaluated.
#define CATCH_REQUIRE(...) (void)(0)
#define CATCH_REQUIRE_FALSE(...) (void)(0)

#define CATCH_REQUIRE_THROWS(...) (void)(0)
#define CATCH_REQUIRE_THROWS_AS(expr, exceptionType) (void)(0)
#define CATCH_REQUIRE_THROWS_WITH(expr, matcher) (void)(0)
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CATCH_REQUIRE_THROWS_MATCHES(expr, exceptionType, matcher) (void)(0)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define CATCH_REQUIRE_NOTHROW(...) (void)(0)

#define CATCH_CHECK(...) (void)(0)
#define CATCH_CHECK_FALSE(...) (void)(0)
// The conditional forms stay real if-statements, so the condition is still
// evaluated and the block that follows the macro still compiles and runs.
#define CATCH_CHECKED_IF(...) if (__VA_ARGS__)
#define CATCH_CHECKED_ELSE(...) if (!(__VA_ARGS__))
#define CATCH_CHECK_NOFAIL(...) (void)(0)

#define CATCH_CHECK_THROWS(...) (void)(0)
#define CATCH_CHECK_THROWS_AS(expr, exceptionType) (void)(0)
#define CATCH_CHECK_THROWS_WITH(expr, matcher) (void)(0)
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CATCH_CHECK_THROWS_MATCHES(expr, exceptionType, matcher) (void)(0)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define CATCH_CHECK_NOTHROW(...) (void)(0)

#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CATCH_CHECK_THAT(arg, matcher) (void)(0)

#define CATCH_REQUIRE_THAT(arg, matcher) (void)(0)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS

// CATCH_CONFIG_DISABLE variants of the CATCH_-prefixed message macros: each
// collapses to the no-op expression (void)(0).
#define CATCH_INFO(msg) (void)(0)
#define CATCH_UNSCOPED_INFO(msg) (void)(0)
#define CATCH_WARN(msg) (void)(0)
// Variadic like the enabled CATCH_CAPTURE, so multi-argument call sites such
// as CATCH_CAPTURE(a, b) keep compiling when Catch is disabled.
#define CATCH_CAPTURE(...) (void)(0)

// CATCH_CONFIG_DISABLE variants of the CATCH_-prefixed registration macros.
// Test-case macros expand to INTERNAL_CATCH_TESTCASE_NO_REGISTRATION with a
// freshly generated unique name; the name/tag arguments are discarded.
#define CATCH_TEST_CASE(...)                 \
    INTERNAL_CATCH_TESTCASE_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____))
// NOTE(review): className is discarded here, whereas CATCH_SCENARIO_METHOD in
// this same disabled table forwards it to
// INTERNAL_CATCH_TESTCASE_METHOD_NO_REGISTRATION -- confirm the asymmetry is
// intended.
#define CATCH_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TESTCASE_NO_REGISTRATION(   \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____))
// Expands to nothing.
#define CATCH_METHOD_AS_TEST_CASE(method, ...)
#define CATCH_REGISTER_TEST_CASE(Function, ...) (void)(0)
// Section macros expand to nothing, so the block that follows them becomes a
// plain compound statement.
#define CATCH_SECTION(...)
#define CATCH_DYNAMIC_SECTION(...)
#define CATCH_FAIL(...) (void)(0)
#define CATCH_FAIL_CHECK(...) (void)(0)
#define CATCH_SUCCEED(...) (void)(0)

#define CATCH_ANON_TEST_CASE()               \
    INTERNAL_CATCH_TESTCASE_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____))

// CATCH_CONFIG_DISABLE variants of the CATCH_-prefixed template test-case
// macros. They forward to the *_NO_REGISTRATION internal macros; the second
// table (CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR) additionally wraps the
// call in INTERNAL_CATCH_EXPAND_VARGS.
//
// In both tables the PRODUCT macros, including their _SIG forms, are aliased
// to the non-SIG CATCH_TEMPLATE_TEST_CASE / CATCH_TEMPLATE_TEST_CASE_METHOD.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define CATCH_TEMPLATE_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION(__VA_ARGS__)
#define CATCH_TEMPLATE_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG_NO_REGISTRATION(__VA_ARGS__)
#define CATCH_TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION(className, __VA_ARGS__)
#define CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG_NO_REGISTRATION(className, __VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE(...) CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(...) CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#else
#define CATCH_TEMPLATE_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION(__VA_ARGS__))
#define CATCH_TEMPLATE_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG_NO_REGISTRATION(__VA_ARGS__))
#define CATCH_TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                        \
            INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION(className, __VA_ARGS__))
#define CATCH_TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                            \
            INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG_NO_REGISTRATION(className, __VA_ARGS__))
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE(...) CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_SIG(...) CATCH_TEMPLATE_TEST_CASE(__VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#define CATCH_TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    CATCH_TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#endif

// "BDD-style" convenience wrappers
// CATCH_CONFIG_DISABLE variants: scenarios become unregistered functions with
// a generated unique name; the name/tag arguments are discarded.
#define CATCH_SCENARIO(...)                  \
    INTERNAL_CATCH_TESTCASE_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____))
// Unlike CATCH_SCENARIO, this form forwards className to the internal macro.
#define CATCH_SCENARIO_METHOD(className, ...)       \
    INTERNAL_CATCH_TESTCASE_METHOD_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____), className)
// The step macros expand to nothing, so the block that follows them becomes a
// plain compound statement.
#define CATCH_GIVEN(desc)
#define CATCH_AND_GIVEN(desc)
#define CATCH_WHEN(desc)
#define CATCH_AND_WHEN(desc)
#define CATCH_THEN(desc)
#define CATCH_AND_THEN(desc)

// Static assertions are dropped entirely: no static_assert is emitted here.
#define CATCH_STATIC_REQUIRE(...) (void)(0)
#define CATCH_STATIC_REQUIRE_FALSE(...) (void)(0)

// If CATCH_CONFIG_PREFIX_ALL is not defined then the CATCH_ prefix is not
// required
#else

// Unprefixed assertion macros for this branch. Every assertion expands to the
// no-op expression (void)(0), so its arguments are discarded by the
// preprocessor and never evaluated.
#define REQUIRE(...) (void)(0)
#define REQUIRE_FALSE(...) (void)(0)

#define REQUIRE_THROWS(...) (void)(0)
#define REQUIRE_THROWS_AS(expr, exceptionType) (void)(0)
#define REQUIRE_THROWS_WITH(expr, matcher) (void)(0)
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define REQUIRE_THROWS_MATCHES(expr, exceptionType, matcher) (void)(0)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define REQUIRE_NOTHROW(...) (void)(0)

#define CHECK(...) (void)(0)
#define CHECK_FALSE(...) (void)(0)
// Unlike the other macros, CHECKED_IF / CHECKED_ELSE keep their condition:
// they become a plain `if`, so the guarded block still runs conditionally.
#define CHECKED_IF(...) if (__VA_ARGS__)
#define CHECKED_ELSE(...) if (!(__VA_ARGS__))
#define CHECK_NOFAIL(...) (void)(0)

#define CHECK_THROWS(...) (void)(0)
#define CHECK_THROWS_AS(expr, exceptionType) (void)(0)
#define CHECK_THROWS_WITH(expr, matcher) (void)(0)
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CHECK_THROWS_MATCHES(expr, exceptionType, matcher) (void)(0)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS
#define CHECK_NOTHROW(...) (void)(0)

// Matcher-based assertions exist only when matchers are not disabled.
#if !defined(CATCH_CONFIG_DISABLE_MATCHERS)
#define CHECK_THAT(arg, matcher) (void)(0)

#define REQUIRE_THAT(arg, matcher) (void)(0)
#endif  // CATCH_CONFIG_DISABLE_MATCHERS

// Logging macros are no-ops as well; the message expression is not evaluated.
#define INFO(msg) (void)(0)
#define UNSCOPED_INFO(msg) (void)(0)
#define WARN(msg) (void)(0)
#define CAPTURE(msg) (void)(0)

// Unprefixed test-case macros for this branch. Name/tag arguments are not
// forwarded; each test case is declared under a unique generated identifier
// via the *_NO_REGISTRATION helpers.
#define TEST_CASE(...)                       \
    INTERNAL_CATCH_TESTCASE_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____))
// Fixture variant: forward className to the METHOD helper, exactly as
// SCENARIO_METHOD does, instead of dropping it. Presumably this keeps test
// bodies that use fixture members compilable in this configuration.
#define TEST_CASE_METHOD(className, ...)            \
    INTERNAL_CATCH_TESTCASE_METHOD_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____), className)
// Registration-only macros: nothing to register, so they expand to nothing or
// to a no-op expression.
#define METHOD_AS_TEST_CASE(method, ...)
#define REGISTER_TEST_CASE(Function, ...) (void)(0)
// Sections expand to nothing; a following brace block is a plain nested scope.
#define SECTION(...)
#define DYNAMIC_SECTION(...)
// Explicit result macros are no-ops.
#define FAIL(...) (void)(0)
#define FAIL_CHECK(...) (void)(0)
#define SUCCEED(...) (void)(0)
#define ANON_TEST_CASE()                     \
    INTERNAL_CATCH_TESTCASE_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____))

// Templated test-case macros for this branch. Both preprocessor branches
// define the same names; the second one additionally wraps each expansion in
// INTERNAL_CATCH_EXPAND_VARGS when CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
// is defined.
#ifndef CATCH_CONFIG_TRADITIONAL_MSVC_PREPROCESSOR
#define TEMPLATE_TEST_CASE(...) INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION(__VA_ARGS__)
#define TEMPLATE_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG_NO_REGISTRATION(__VA_ARGS__)
#define TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION(className, __VA_ARGS__)
#define TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG_NO_REGISTRATION(className, __VA_ARGS__)
// The PRODUCT variants reuse the plain template macros.
// NOTE(review): the *_SIG product variants forward to the non-SIG macros
// (TEMPLATE_TEST_CASE / TEMPLATE_TEST_CASE_METHOD) - confirm this is intended.
#define TEMPLATE_PRODUCT_TEST_CASE(...) TEMPLATE_TEST_CASE(__VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_SIG(...) TEMPLATE_TEST_CASE(__VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#else
#define TEMPLATE_TEST_CASE(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_NO_REGISTRATION(__VA_ARGS__))
#define TEMPLATE_TEST_CASE_SIG(...) \
    INTERNAL_CATCH_EXPAND_VARGS(INTERNAL_CATCH_TEMPLATE_TEST_CASE_SIG_NO_REGISTRATION(__VA_ARGS__))
#define TEMPLATE_TEST_CASE_METHOD(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                  \
            INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_NO_REGISTRATION(className, __VA_ARGS__))
#define TEMPLATE_TEST_CASE_METHOD_SIG(className, ...) \
    INTERNAL_CATCH_EXPAND_VARGS(                      \
            INTERNAL_CATCH_TEMPLATE_TEST_CASE_METHOD_SIG_NO_REGISTRATION(className, __VA_ARGS__))
#define TEMPLATE_PRODUCT_TEST_CASE(...) TEMPLATE_TEST_CASE(__VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_SIG(...) TEMPLATE_TEST_CASE(__VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD(className, ...) \
    TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#define TEMPLATE_PRODUCT_TEST_CASE_METHOD_SIG(className, ...) \
    TEMPLATE_TEST_CASE_METHOD(className, __VA_ARGS__)
#endif

// Static assertions are replaced by a no-op expression; the arguments are
// never evaluated.
#define STATIC_REQUIRE(...) (void)(0)
#define STATIC_REQUIRE_FALSE(...) (void)(0)

#endif

// Declares an exception translator through the *_NO_REG helper, under a
// unique generated name and with the user-supplied signature.
#define CATCH_TRANSLATE_EXCEPTION(signature)   \
    INTERNAL_CATCH_TRANSLATE_EXCEPTION_NO_REG( \
            INTERNAL_CATCH_UNIQUE_NAME(catch_internal_ExceptionTranslator), signature)

// "BDD-style" convenience wrappers
// As with the test-case macros, the name/tag arguments are not forwarded.
#define SCENARIO(...)                        \
    INTERNAL_CATCH_TESTCASE_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____))
// Fixture variant: the unique identifier and className are forwarded.
#define SCENARIO_METHOD(className, ...)             \
    INTERNAL_CATCH_TESTCASE_METHOD_NO_REGISTRATION( \
            INTERNAL_CATCH_UNIQUE_NAME(____C_A_T_C_H____T_E_S_T____), className)

// The BDD section macros expand to nothing, so a brace block written after
// them is left as an ordinary nested scope.
#define GIVEN(desc)
#define AND_GIVEN(desc)
#define WHEN(desc)
#define AND_WHEN(desc)
#define THEN(desc)
#define AND_THEN(desc)

using Catch::Detail::Approx;

#endif

#endif  // ! CATCH_CONFIG_IMPL_ONLY

// start catch_reenable_warnings.h

// Pop the compiler's diagnostic state; presumably this pairs with a matching
// push near the top of the header (outside this excerpt).
#ifdef __clang__
#ifdef __ICC  // icpc defines the __clang__ macro
#pragma warning(pop)
#else
#pragma clang diagnostic pop
#endif
#elif defined __GNUC__
#pragma GCC diagnostic pop
#endif

// end catch_reenable_warnings.h
// end catch.hpp
#endif  // TWOBLUECUBES_SINGLE_INCLUDE_CATCH_HPP_INCLUDED


================================================
FILE: third_party/include/gsl/gsl
================================================
//
// gsl-lite is based on GSL: Guidelines Support Library.
// For more information see https://github.com/gsl-lite/gsl-lite
//
// Copyright (c) 2015 Martin Moene
// Copyright (c) 2015 Microsoft Corporation. All rights reserved.
//
// This code is licensed under the MIT License (MIT).
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.

// mimic MS include hierarchy

// Deprecated forwarding header: emits a compile-time message and then simply
// includes gsl-lite.hpp. Protected by both #pragma once and an include guard.
#pragma once

#ifndef GSL_GSL_H_INCLUDED
#define GSL_GSL_H_INCLUDED

#pragma message ("gsl/gsl is deprecated since version 0.38.1, use gsl/gsl-lite.hpp instead.")

#include "gsl-lite.hpp"

#endif // GSL_GSL_H_INCLUDED


================================================
FILE: third_party/include/gsl/gsl-lite-vc6.hpp
================================================
//
// gsl-lite-vc6 is based on GSL: Guidelines Support Library,
// For more information see https://github.com/gsl-lite/gsl-lite
//
// Copyright (c) 2015 Martin Moene
// Copyright (c) 2015 Microsoft Corporation. All rights reserved.
//
// This code is licensed under the MIT License (MIT).
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.

#pragma once

#ifndef GSL_GSL_LITE_H_INCLUDED
#define GSL_GSL_LITE_H_INCLUDED

#include <exception>
#include <iterator>
#include <limits>
#include <memory>
#include <stdexcept>
#include <string>
#include <utility>
#include <vector>

// Version string reported by this VC6 variant of the header.
#define gsl_lite_VERSION "0.0.0"

// Configuration:
// Every option below is only given its default when the user has not already
// defined it (for example on the compiler command line).

// When non-zero, defines the `implicit` marker macro (see further below).
#ifndef gsl_FEATURE_IMPLICIT_MACRO
#define gsl_FEATURE_IMPLICIT_MACRO 1
#endif

// When non-zero, defines the Owner(t) macro.
#ifndef gsl_FEATURE_OWNER_MACRO
#define gsl_FEATURE_OWNER_MACRO 1
#endif

// When non-zero, includes gsl_CONFIG_SHARED_PTR_INCLUDE and imports
// gsl_CONFIG_SHARED_PTR_DECL into namespace gsl.
#ifndef gsl_FEATURE_SHARED_PTR
#define gsl_FEATURE_SHARED_PTR 0
#endif

// When non-zero, includes gsl_CONFIG_UNIQUE_PTR_INCLUDE and imports
// gsl_CONFIG_UNIQUE_PTR_DECL into namespace gsl.
#ifndef gsl_FEATURE_UNIQUE_PTR
#define gsl_FEATURE_UNIQUE_PTR 0
#endif

// When non-zero, contract violations throw fail_fast instead of terminating.
#ifndef gsl_CONFIG_THROWS_FOR_TESTING
#define gsl_CONFIG_THROWS_FOR_TESTING 0
#endif

#ifndef gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS
#define gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS 0
#endif

// Header and qualified name used for the optional smart-pointer imports;
// the defaults refer to Boost.
#ifndef gsl_CONFIG_SHARED_PTR_INCLUDE
#define gsl_CONFIG_SHARED_PTR_INCLUDE <boost/shared_ptr.hpp>
#endif

#ifndef gsl_CONFIG_UNIQUE_PTR_INCLUDE
#define gsl_CONFIG_UNIQUE_PTR_INCLUDE <boost/unique_ptr.hpp>
#endif

#ifndef gsl_CONFIG_SHARED_PTR_DECL
#define gsl_CONFIG_SHARED_PTR_DECL boost::shared_ptr
#endif

#ifndef gsl_CONFIG_UNIQUE_PTR_DECL
#define gsl_CONFIG_UNIQUE_PTR_DECL boost::unique_ptr
#endif

// Compiler detection:

// gsl_COMPILER_MSVC_VERSION maps _MSC_VER to a two/three-digit product
// version: _MSC_VER / 10 minus 60 for values below 1900 (so 1200 -> 60, i.e.
// Visual C++ 6), or minus 50 from 1900 on. Non-MSVC compilers (and clang
// masquerading as MSVC) get 0.
#if defined(_MSC_VER) && !defined(__clang__)
#define gsl_COMPILER_MSVC_VER (_MSC_VER)
#define gsl_COMPILER_MSVC_VERSION (_MSC_VER / 10 - 10 * (5 + (_MSC_VER < 1900)))
#else
#define gsl_COMPILER_MSVC_VER 0
#define gsl_COMPILER_MSVC_VERSION 0
#define gsl_COMPILER_NON_MSVC 1
#endif

// Refuse to compile with anything other than Visual C++ 6.
#if gsl_COMPILER_MSVC_VERSION != 60
#error GSL Lite: this header is for Visual C++ 6
#endif

// half-open range [lo..hi):
// Note that v is evaluated twice.
#define gsl_BETWEEN(v, lo, hi) ((lo) <= (v) && (v) < (hi))

// Presence of C++ language features:

// C++ feature usage:

// `implicit` expands to nothing; it can be used to mark constructors that are
// intentionally non-explicit.
#if gsl_FEATURE_IMPLICIT_MACRO
#define implicit
#endif

// Element count of a built-in array: total size divided by the size of the
// first element (`0 [a]` is the same expression as `a[0]`).
#define gsl_DIMENSION_OF(a) (sizeof(a) / sizeof(0 [a]))

// Optional smart-pointer headers, pulled in only when the feature is enabled.
#if gsl_FEATURE_SHARED_PTR
#include gsl_CONFIG_SHARED_PTR_INCLUDE
#endif

#if gsl_FEATURE_UNIQUE_PTR
#include gsl_CONFIG_UNIQUE_PTR_INCLUDE
#endif

namespace gsl {

//
// GSL.owner: ownership pointers
//
// ToDo:
// Import the configured smart-pointer names into namespace gsl when enabled.
#if gsl_FEATURE_SHARED_PTR
using gsl_CONFIG_SHARED_PTR_DECL;
#endif
#if gsl_FEATURE_UNIQUE_PTR
using gsl_CONFIG_UNIQUE_PTR_DECL;
#endif

// Ownership annotation: owner<T>::type is simply T. It adds no behaviour and
// only documents intent at the point of use.
template <class T>
struct owner {
    typedef T type;
};

// owner is provided as a struct with a nested typedef here, not as an alias
// template, hence the 0.
#define gsl_HAVE_OWNER_TEMPLATE 0

// Owner(t) is shorthand for the nested typedef above.
#if gsl_FEATURE_OWNER_MACRO
#define Owner(t) ::gsl::owner<t>::type
#endif

//
// GSL.assert: assertions
//
// Pre- and postcondition checks; both forward the condition to
// fail_fast_assert().
#define Expects(x) ::gsl::fail_fast_assert((x))
#define Ensures(x) ::gsl::fail_fast_assert((x))

#if gsl_CONFIG_THROWS_FOR_TESTING

// Exception thrown on a failed contract check in the throwing configuration.
struct fail_fast : public std::runtime_error {
    fail_fast() : std::runtime_error("GSL assertion") {}

    explicit fail_fast(char const *const message) : std::runtime_error(message) {}
};

// Throws fail_fast when cond is false.
inline void fail_fast_assert(bool cond) {
    if (!cond)
        throw fail_fast();
}

// Throws fail_fast carrying the given message when cond is false.
inline void fail_fast_assert(bool cond, char const *const message) {
    if (!cond)
        throw fail_fast(message);
}

#else  // gsl_CONFIG_THROWS_FOR_TESTING

// Calls terminate() when cond is false. The call is unqualified, so it relies
// on terminate being visible without the std:: prefix.
inline void fail_fast_assert(bool cond) {
    if (!cond)
        terminate();
}

// Same as above; the message argument is ignored in this configuration.
inline void fail_fast_assert(bool cond, char const *const) {
    if (!cond)
        terminate();
}

#endif  // gsl_CONFIG_THROWS_FOR_TESTING

//
// GSL.util: utilities
//

// Scope guard: stores a plain function pointer and calls it from the
// destructor.
// NOTE(review): the class is copyable and has no "dismissed" state, so every
// copy that gets destroyed invokes the action again - confirm callers rely on
// the copy in finally() being elided.
class final_action {
public:
    // Only parameterless functions returning void can be registered.
    typedef void (*Action)();

    final_action(Action action) : action_(action) {}

    ~final_action() { action_(); }

private:
    Action action_;
};

// Convenience factory: wraps f in a final_action. f must be convertible to
// final_action::Action.
template <class Fn>
final_action finally(Fn const &f) {
    return final_action((f));
}

// Unchecked narrowing conversion: a searchable spelling of static_cast that
// marks the narrowing as intentional.
template <class T, class U>
T narrow_cast(U u) {
    return static_cast<T>(u);
}

// Thrown by narrow() when the conversion would change the value.
struct narrowing_error : public std::exception {};

// Checked narrowing conversion.
//
// Converts u to T and returns the result, or throws narrowing_error when the
// converted value does not represent the same number as u.
template <class T, class U>
T narrow(U u) {
    T t = narrow_cast<T>(u);

    // Round-trip check: catches values that do not fit into T.
    if (static_cast<U>(t) != u) {
        throw narrowing_error();
    }
    // Sign check: a signed/unsigned conversion can round-trip bit-for-bit
    // while changing the value (e.g. -1 -> 4294967295u -> -1), so also require
    // that source and result agree on being negative.
    if ((t < T()) != (u < U())) {
        throw narrowing_error();
    }
    return t;
}

//
// GSL.views: views
//

//
// at() - Bounds-checked way of accessing static arrays, std::array,
// std::vector.
//

namespace detail {

// Tag types used to rank overloads: order_precedence derives from
// precedence_1, which derives from precedence_0, so an overload taking
// precedence_1 is a better match than one taking precedence_0.
struct precedence_0 {};
struct precedence_1 : precedence_0 {};
struct order_precedence : precedence_1 {};

// Fallback overload (lowest precedence) for built-in arrays: checks the index
// against the array's element count and returns the element. The T* argument
// only serves to deduce the element type.
template <class Array, class T>
T &at(Array &arr, size_t index, T *, precedence_0 const &) {
    Expects(index < gsl_DIMENSION_OF(arr));
    return arr[index];
}

}  // namespace detail

// Create an at( container ) function:
// The macro re-opens namespace gsl itself, so it has to be invoked outside of
// namespace gsl. The generated overload takes precedence_1 and is therefore
// preferred over the array fallback for Cont<T> arguments.

#define gsl_MK_AT(Cont)                                                    \
    namespace gsl {                                                        \
    namespace detail {                                                     \
    template <class T>                                                     \
    inline T &at(Cont<T> &cont, size_t index, T *, precedence_1 const &) { \
        Expects(index < cont.size());                                      \
        return cont[index];                                                \
    }                                                                      \
    }                                                                      \
    }

// Public entry point: dispatches to the best detail::at overload, passing
// &cont[0] so the element type can be deduced.
// NOTE(review): the return type is hard-coded to int&, so this only works as
// written for containers of int - presumably a VC6 limitation; confirm.
template <class Cont>
int &at(Cont &cont, size_t index) {
    return detail::at(cont, index, &cont[0], detail::order_precedence());
}

//
// not_null<> - Wrap any indirection and enforce non-null.
//
// Wrapper around a pointer-like T that checks, on construction and on
// assignment from a T, that the wrapped value is not NULL.
template <class T>
class not_null {
public:
    // Wraps t; the contract check fails if t is NULL.
    not_null(T t) : ptr_(t) { Expects(ptr_ != NULL); }
    // Re-seats the wrapper; the contract check fails if t is NULL.
    not_null &operator=(T const &t) {
        ptr_ = t;
        Expects(ptr_ != NULL);
        return *this;
    }

    // Copies need no check: other already holds a non-null value.
    not_null(not_null const &other) : ptr_(other.ptr_) {}
    not_null &operator=(not_null const &other) {
        ptr_ = other.ptr_;
        // The operator is declared to return a reference, so it must return
        // one; flowing off the end of a non-void function is undefined.
        return *this;
    }

    // VC6 accepts this anyway:
    // template< typename U > not_null( not_null<U> const & other );
    // template< typename U > not_null & operator=( not_null<U> const & other ) ;

private:
    // Prevent compilation when initialized with a literal 0:
    not_null(int);
    not_null &operator=(int);

public:
    // Access to the wrapped value.
    T get() const { return ptr_; }

    operator T() const { return get(); }
    T operator->() const { return get(); }

    // Comparison against a raw T.
    bool operator==(T const &rhs) const { return ptr_ == rhs; }
    bool operator!=(T const &rhs) const { return !(*this == rhs); }

private:
    T ptr_;

    // Pointer arithmetic is declared private and left undefined, so it cannot
    // be used on a not_null.
    not_null &operator++();
    not_null &operator--();
    not_null operator++(int);
    not_null operator--(int);
    not_null &operator+(size_t);
    not_null &operator+=(size_t);
    not_null &operator-(size_t);
    not_null &operator-=(size_t);
};

//
// Byte-specific type.
//
typedef unsigned char byte;

//
// span<> - A 1D view of contiguous T's, replace (*,len).
//
// Non-owning view over a contiguous run of T, stored as a [begin_, end_)
// pointer pair. Copying a span copies the two pointers, never the elements.
template <class T>
class span {
public:
    typedef size_t size_type;

    typedef T value_type;
    typedef T &reference;
    typedef T *pointer;
    typedef T const *const_pointer;

    // Iterators are plain pointers.
    typedef pointer iterator;
    typedef const_pointer const_iterator;

    // Two-argument form of std::reverse_iterator (iterator type, value type).
    typedef std::reverse_iterator<iterator, T> reverse_iterator;
    typedef std::reverse_iterator<const_iterator, const T> const_reverse_iterator;

    // Todo:
    // typedef typename std::iterator_traits< iterator >::difference_type
    // difference_type;

    // Empty span: both pointers are NULL.
    span() : begin_(NULL), end_(NULL) { Expects(size() == 0); }

    // View over [begin, end); requires begin <= end.
    span(pointer begin, pointer end) : begin_(begin), end_(end) { Expects(begin <= end); }

    // View over size elements starting at data; data may only be NULL when
    // size is 0.
    span(pointer data, size_type size) : begin_(data), end_(data + size) {
        Expects(size == 0 || (size > 0 && data != NULL));
    }

private:
    // Overload-ranking tags for create(): order_precedence derives from
    // precedence_1, so the std::vector overload (precedence_1) is preferred
    // over the generic array overload (precedence_0). precedence_2 is declared
    // but not used by any overload in this class.
    struct precedence_0 {};
    struct precedence_1 : precedence_0 {};
    struct precedence_2 : precedence_1 {};
    struct order_precedence : precedence_1 {};

    // Built-in array: the length is taken from the array type.
    template <class Array, class U>
    span create(Array &arr, U *, precedence_0 const &) const {
        return span(arr, gsl_DIMENSION_OF(arr));
    }

    // std::vector<T>: views all of the vector's elements.
    span create(std::vector<T> &cont, T *, precedence_1 const &) const {
        return span(&cont[0], cont.size());
    }

public:
    // Construct from an array or std::vector by delegating to create() and
    // assigning the result. begin_/end_ are not initialized before that
    // assignment.
    // NOTE(review): &cont[0] is evaluated unconditionally - confirm callers
    // never pass an empty container.
    template <class Cont>
    span(Cont &cont) {
        *this = create(cont, &cont[0], order_precedence());
    }

#if 0
    // =default constructor
    span( span const & other )
        : begin_( other.begin() )
        , end_  ( other.end() )
    {}
#endif

    span &operator=(span const &other) {
        // VC6 balks at copy-swap implementation (here),
        // so we do it the simple way:
        begin_ = other.begin_;
        end_ = other.end_;
        return *this;
    }

#if 0
    // Converting from other span ?
    template< typename U > operator=();
#endif

    // Iteration. All accessors are const and hand out pointers into the
    // viewed range.
    iterator begin() const { return iterator(begin_); }

    iterator end() const { return iterator(end_); }

    const_iterator cbegin() const { return const_iterator(begin()); }

    const_iterator cend() const { return const_iterator(end()); }

    reverse_iterator rbegin() const { return reverse_iterator(end()); }

    reverse_iterator rend() const { return reverse_iterator(begin()); }

    const_reverse_iterator crbegin() const { return const_reverse_iterator(cend()); }

    const_reverse_iterator crend() const { return const_reverse_iterator(cbegin()); }

    // True when the span points at something, i.e. begin_ is not NULL.
    operator bool() const { return begin_ != NULL; }

    // Bounds-checked element access (same as at()). Non-const, so it cannot
    // be used on a const span object.
    reference operator[](size_type index) { return at(index); }

    // Equal when the sizes match and either both spans start at the same
    // address or their elements compare equal.
    bool operator==(span const &other) const {
        return size() == other.size() &&
               (begin_ == other.begin_ || std::equal(this->begin(), this->end(), other.begin()));
    }

    bool operator!=(span const &other) const { return !(*this == other); }

    // Lexicographical ordering of the viewed elements; the remaining
    // relational operators are derived from operator<.
    bool operator<(span const &other) const {
        return std::lexicographical_compare(this->begin(), this->end(), other.begin(), other.end());
    }

    bool operator<=(span const &other) const { return !(other < *this); }

    bool operator>(span const &other) const { return (other < *this); }

    bool operator>=(span const &other) const { return !(*this < other); }

    // Bounds-checked element access. index is unsigned, so the `index >= 0`
    // half of the check is always true.
    reference at(size_type index) {
        Expects(index >= 0 && index < size());
        return begin_[index];
    }

    pointer data() const { return begin_; }

    bool empty() const { return size() == 0; }

    // Number of elements in the view.
    size_type size() const { return std::distance(begin_, end_); }

    size_type length() const { return size(); }

    size_type used_length() const { return length(); }

    // Size of the viewed range in bytes.
    size_type bytes() const { return sizeof(value_type) * size(); }

    size_type used_bytes() const { return bytes(); }

    // Exchanges the two pointer pairs.
    void swap(span &other) {
        using std::swap;
        swap(begin_, other.begin_);
        swap(end_, other.end_);
    }

    // Reinterpret the viewed memory as read-only bytes.
    span<const byte> as_bytes() const {
        return span<const byte>(reinterpret_cast<const byte *>(data()), bytes());
    }

    // Reinterpret the viewed memory as writable bytes.
    span<byte> as_writeable_bytes() const {
        return span<byte>(reinterpret_cast<byte *>(data()), bytes());
    }

    // Helper that builds a span<U> from a pointer and a length.
    template <class U>
    struct mk {
        static span<U> view(U *data, size_type size) { return span<U>(data, size); }
    };

    // Reinterpret the viewed memory as a span of U; the byte size must be a
    // multiple of sizeof(U). The parameter u is unused - presumably it exists
    // so VC6 can deduce U from an argument; confirm.
    template <typename U>
    span<U> as_span(U u = U()) const {
        Expects((this->bytes() % sizeof(U)) == 0);
        return mk<U>::view(reinterpret_cast<U *>(this->data()), this->bytes() / sizeof(U));
    }

private:
    pointer begin_;
    pointer end_;
};

// span creator functions (see ctors)

// Free-function form of span::as_bytes(): views the memory behind spn as
// read-only bytes.
template <typename T>
span<const byte> as_bytes(span<T> spn) {
    const byte *const first = reinterpret_cast<const byte *>(spn.data());
    return span<const byte>(first, spn.bytes());
}

// Free-function form of span::as_writeable_bytes(): views the memory behind
// spn as writable bytes.
template <typename T>
span<byte> as_writeable_bytes(span<T> spn) {
    byte *const first = reinterpret_cast<byte *>(spn.data());
    return span<byte>(first, spn.bytes());
}

// Creates a span over the pointer range [begin, end).
template <typename T>
span<T> as_span(T *begin, T *end) {
    span<T> view(begin, end);
    return view;
}

// Creates a span over size elements starting at begin.
template <typename T>
span<T> as_span(T *begin, size_t size) {
    span<T> view(begin, size);
    return view;
}

namespace detail {

// Helper that builds a span<T> from a std::vector<T> through span's
// container constructor.
template <class T>
struct mk {
    static span<T> view(std::vector<T> &cont) { return span<T>(cont); }
};
}  // namespace detail

// Creates a span over all elements of cont. The span refers to the vector's
// storage; it does not copy the elements.
template <class T>
span<T> as_span(std::vector<T> &cont) {
    return detail::mk<T>::view(cont);
}

//
// String types:
//

// Pointer typedefs for C-style strings: mutable and const, narrow and wide.
typedef char *zstring;
typedef wchar_t *zwstring;
typedef const char *czstring;
typedef const wchar_t *cwzstring;

// span specializations over character data, in the same four flavours.
typedef span<char> string_span;
typedef span<wchar_t> wstring_span;
typedef span<const char> cstring_span;
typedef span<const wchar_t> cwstring_span;

// to_string() allow (explicit) conversions from string_span to string

// Copies the characters viewed by a mutable narrow span into a std::string.
inline std::string to_string(string_span const &view) {
    std::string text(view.data(), view.length());
    return text;
}

// Copies the characters viewed by a read-only narrow span into a std::string.
inline std::string to_string(cstring_span const &view) {
    std::string text(view.data(), view.length());
    return text;
}

// Copies the characters viewed by a mutable wide span into a std::wstring.
inline std::wstring to_string(wstring_span const &view) {
    std::wstring text(view.data(), view.length());
    return text;
}

// Copies the characters viewed by a read-only wide span into a std::wstring.
inline std::wstring to_string(cwstring_span const &view) {
    std::wstring text(view.data(), view.length());
    return text;
}

//
// ensure_sentinel()
//
// Provides a way to obtain a span from a contiguous sequence
// that ends with a (non-inclusive) sentinel value.
//
// Will fail-fast if sentinel cannot be found before max elements are examined.
//
namespace detail {

// Scans a sequence for a sentinel value and returns a span over the elements
// that precede it.
template <class T, class SizeType, const T Sentinel>
struct ensure {
    // seq: start of the sequence.
    // max: maximum number of elements to step over while searching.
    // Returns span [seq, position of the sentinel). The contract check fails
    // if the element reached when the scan stops is not the sentinel.
    static span<T> sentinel(T *seq, SizeType max = (std::numeric_limits<SizeType>::max)()) {
        typedef T *pointer;

        pointer cur = seq;

        // Compare in SizeType: the distance walked is never negative, whereas
        // casting max to the signed difference type turns the default (the
        // largest SizeType value) into a negative number, which would make the
        // loop condition false immediately and stop the scan at seq.
        while (static_cast<SizeType>(cur - seq) < max && *cur != Sentinel)
            ++cur;

        Expects(*cur == Sentinel);

        return span<T>(seq, cur - seq);
    }
};
}  // namespace detail

//
// ensure_z - creates a string_span for a czstring or cwzstring.
// Will fail fast if a null-terminator cannot be found before
// the limit of size_type.
//

// Returns a span over the elements of sz that precede the first element equal
// to 0, examining at most max elements (delegates to detail::ensure with
// size_t as the size type and 0 as the sentinel).
template <typename T>
span<T> ensure_z(T *sz, size_t max = (std::numeric_limits<size_t>::max)()) {
    return detail::ensure<T, size_t, 0>::sentinel(sz, max);
}

}  // namespace gsl

// at( std::vector ):

gsl_MK_AT(std::vector)

#endif  // GSL_GSL_LITE_H_INCLUDED

        // end of file


================================================
FILE: third_party/include/gsl/gsl-lite.h
================================================
//
// gsl-lite is based on GSL: Guidelines Support Library.
// For more information see https://github.com/gsl-lite/gsl-lite
//
// Copyright (c) 2015 Martin Moene
// Copyright (c) 2015 Microsoft Corporation. All rights reserved.
//
// This code is licensed under the MIT License (MIT).
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.

// mimic MS include hierarchy

// Deprecated forwarding header: emits a compile-time message and then simply
// includes gsl-lite.hpp.
#ifndef GSL_GSL_LITE_H_INCLUDED
#define GSL_GSL_LITE_H_INCLUDED

#pragma message("gsl/gsl-lite.h is deprecated since version 0.27.0, use gsl/gsl-lite.hpp instead.")

#include "gsl-lite.hpp"

#endif  // GSL_GSL_LITE_H_INCLUDED


================================================
FILE: third_party/include/gsl/gsl-lite.hpp
================================================
//
// gsl-lite is based on GSL: Guidelines Support Library.
// For more information see https://github.com/gsl-lite/gsl-lite
//
// Copyright (c) 2015-2019 Martin Moene
// Copyright (c) 2019-2021 Moritz Beutel
// Copyright (c) 2015-2018 Microsoft Corporation. All rights reserved.
//
// This code is licensed under the MIT License (MIT).
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.

#ifndef GSL_GSL_LITE_HPP_INCLUDED
#define GSL_GSL_LITE_HPP_INCLUDED

#include <cstddef>    // for size_t, ptrdiff_t, nullptr_t
#include <exception>  // for exception, terminate(), uncaught_exceptions()
#include <ios>        // for ios_base, streamsize
#include <iosfwd>     // for basic_ostream<>
#include <limits>
#include <memory>     // for addressof(), unique_ptr<>, shared_ptr<>
#include <stdexcept>  // for logic_error
#include <string>
#include <utility>  // for move(), forward<>(), swap()

// Library version components.
#define gsl_lite_MAJOR 0
#define gsl_lite_MINOR 38
#define gsl_lite_PATCH 1

// Version as a string literal "MAJOR.MINOR.PATCH", assembled from the
// components above. gsl_STRINGIFY is defined just below; that is fine because
// macros are only expanded where gsl_lite_VERSION is used.
#define gsl_lite_VERSION                                                               \
    gsl_STRINGIFY(gsl_lite_MAJOR) "." gsl_STRINGIFY(gsl_lite_MINOR) "." gsl_STRINGIFY( \
            gsl_lite_PATCH)

// Preprocessor helpers. The two-level definitions make sure macro arguments
// are expanded before they are stringified (#) or pasted (##).
#define gsl_STRINGIFY(x) gsl_STRINGIFY_(x)
#define gsl_STRINGIFY_(x) #x
#define gsl_CONCAT_(a, b) gsl_CONCAT2_(a, b)
#define gsl_CONCAT2_(a, b) a##b
// Invokes a function-like macro f with no arguments.
#define gsl_EVALF_(f) f()

// configuration argument checking:

// Whitelists of accepted configuration values. For every accepted value V
// there is a macro <prefix>V defined as 1. The gsl_CHECK_CFG_*_VALUE_(x)
// macros below paste the (expanded) value of x onto the prefix: an accepted
// value yields one of these macros (1), anything else yields an undefined
// identifier, which evaluates to 0 inside #if.

// Toggles: 0 or 1.
#define gsl_DETAIL_CFG_TOGGLE_VALUE_1 1
#define gsl_DETAIL_CFG_TOGGLE_VALUE_0 1
// Defaults version: 0 or 1.
#define gsl_DETAIL_CFG_DEFAULTS_VERSION_VALUE_1 1
#define gsl_DETAIL_CFG_DEFAULTS_VERSION_VALUE_0 1
// Language standard selectors: 98, 3, 03, 11, 14, 17, 20.
#define gsl_DETAIL_CFG_STD_VALUE_98 1
#define gsl_DETAIL_CFG_STD_VALUE_3 1
#define gsl_DETAIL_CFG_STD_VALUE_03 1
#define gsl_DETAIL_CFG_STD_VALUE_11 1
#define gsl_DETAIL_CFG_STD_VALUE_14 1
#define gsl_DETAIL_CFG_STD_VALUE_17 1
#define gsl_DETAIL_CFG_STD_VALUE_20 1
// Macros that must be defined without a value: empty, or 1 (see the comment
// on the next definition).
#define gsl_DETAIL_CFG_NO_VALUE_ 1
#define gsl_DETAIL_CFG_NO_VALUE_1 \
    1  // many compilers treat the command-line parameter "-Dfoo" as equivalent to \
            // "-Dfoo=1", so we tolerate that
#define gsl_CHECK_CFG_TOGGLE_VALUE_(x) gsl_CONCAT_(gsl_DETAIL_CFG_TOGGLE_VALUE_, x)
#define gsl_CHECK_CFG_DEFAULTS_VERSION_VALUE_(x) \
    gsl_CONCAT_(gsl_DETAIL_CFG_DEFAULTS_VERSION_VALUE_, x)
#define gsl_CHECK_CFG_STD_VALUE_(x) gsl_CONCAT_(gsl_DETAIL_CFG_STD_VALUE_, x)
// The extra underscore is pasted separately so that an empty x still forms
// the valid name gsl_DETAIL_CFG_NO_VALUE_.
#define gsl_CHECK_CFG_NO_VALUE_(x) gsl_CONCAT_(gsl_DETAIL_CFG_NO_VALUE, gsl_CONCAT_(_, x))

// gsl-lite backward compatibility:

// Defaults version: validated when user-supplied, otherwise set to the
// library's major version. An invalid value only produces a compile-time
// message, not an error.
#if defined(gsl_CONFIG_DEFAULTS_VERSION)
#if !gsl_CHECK_CFG_DEFAULTS_VERSION_VALUE_(gsl_CONFIG_DEFAULTS_VERSION)
#pragma message("invalid configuration value gsl_CONFIG_DEFAULTS_VERSION=" gsl_STRINGIFY( \
        gsl_CONFIG_DEFAULTS_VERSION) ", must be 0 or 1")
#endif
#else
#define gsl_CONFIG_DEFAULTS_VERSION gsl_lite_MAJOR  // default
#endif
#define gsl_CONFIG_DEFAULTS_VERSION_() gsl_CONFIG_DEFAULTS_VERSION

// Deprecated option name: its value is carried over to
// gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR and a deprecation
// message is emitted.
#if defined(gsl_CONFIG_ALLOWS_SPAN_CONTAINER_CTOR)
#if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_ALLOWS_SPAN_CONTAINER_CTOR)
#pragma message(                                                                            \
        "invalid configuration value gsl_CONFIG_ALLOWS_SPAN_CONTAINER_CTOR=" gsl_STRINGIFY( \
                gsl_CONFIG_ALLOWS_SPAN_CONTAINER_CTOR) ", must be 0 or 1")
#endif
#define gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR gsl_CONFIG_ALLOWS_SPAN_CONTAINER_CTOR
#pragma message( \
        "gsl_CONFIG_ALLOWS_SPAN_CONTAINER_CTOR is deprecated since gsl-lite 0.7; replace with gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR, or consider span(with_container, cont).")
#endif

// Deprecated gsl_CONFIG_CONTRACT_LEVEL_* switches: each one is checked to be
// defined without a value, reported as deprecated, and translated into the
// corresponding gsl_CONFIG_CONTRACT_CHECKING_* macros.
#if defined(gsl_CONFIG_CONTRACT_LEVEL_ON)
#if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_LEVEL_ON)
#pragma message("invalid configuration value gsl_CONFIG_CONTRACT_LEVEL_ON=" gsl_STRINGIFY( \
        gsl_CONFIG_CONTRACT_LEVEL_ON) "; macro must be defined without value")
#endif
#pragma message( \
        "gsl_CONFIG_CONTRACT_LEVEL_ON is deprecated since gsl-lite 0.36; replace with gsl_CONFIG_CONTRACT_CHECKING_ON.")
#define gsl_CONFIG_CONTRACT_CHECKING_ON
#endif
#if defined(gsl_CONFIG_CONTRACT_LEVEL_OFF)
#if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_LEVEL_OFF)
#pragma message("invalid configuration value gsl_CONFIG_CONTRACT_LEVEL_OFF=" gsl_STRINGIFY( \
        gsl_CONFIG_CONTRACT_LEVEL_OFF) "; macro must be defined without value")
#endif
#pragma message( \
        "gsl_CONFIG_CONTRACT_LEVEL_OFF is deprecated since gsl-lite 0.36; replace with gsl_CONFIG_CONTRACT_CHECKING_OFF.")
#define gsl_CONFIG_CONTRACT_CHECKING_OFF
#endif
// EXPECTS_ONLY and ENSURES_ONLY form an #if/#elif pair, so when both are
// defined only EXPECTS_ONLY takes effect.
#if defined(gsl_CONFIG_CONTRACT_LEVEL_EXPECTS_ONLY)
#if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_LEVEL_EXPECTS_ONLY)
#pragma message(                                                                             \
        "invalid configuration value gsl_CONFIG_CONTRACT_LEVEL_EXPECTS_ONLY=" gsl_STRINGIFY( \
                gsl_CONFIG_CONTRACT_LEVEL_EXPECTS_ONLY) "; macro must be defined without value")
#endif
#pragma message( \
        "gsl_CONFIG_CONTRACT_LEVEL_EXPECTS_ONLY is deprecated since gsl-lite 0.36; replace with gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF and gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF.")
#define gsl_CONFIG_CONTRACT_CHECKING_ON
#define gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF
#define gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF
#elif defined(gsl_CONFIG_CONTRACT_LEVEL_ENSURES_ONLY)
#if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_LEVEL_ENSURES_ONLY)
#pragma message(                                                                             \
        "invalid configuration value gsl_CONFIG_CONTRACT_LEVEL_ENSURES_ONLY=" gsl_STRINGIFY( \
                gsl_CONFIG_CONTRACT_LEVEL_ENSURES_ONLY) "; macro must be defined without value")
#endif
#pragma message( \
        "gsl_CONFIG_CONTRACT_LEVEL_ENSURES_ONLY is deprecated since gsl-lite 0.36; replace with gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF and gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF.")
#define gsl_CONFIG_CONTRACT_CHECKING_ON
#define gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF
#define gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF
#endif

// M-GSL compatibility:

// Each GSL_*_ON_CONTRACT_VIOLATION macro is checked to be defined without a
// value and then translated into the equivalent gsl_CONFIG_* macro.

// Throw on violation.
#if defined(GSL_THROW_ON_CONTRACT_VIOLATION)
#if !gsl_CHECK_CFG_NO_VALUE_(GSL_THROW_ON_CONTRACT_VIOLATION)
#pragma message("invalid configuration value GSL_THROW_ON_CONTRACT_VIOLATION=" gsl_STRINGIFY( \
        GSL_THROW_ON_CONTRACT_VIOLATION) "; macro must be defined without value")
#endif
#define gsl_CONFIG_CONTRACT_VIOLATION_THROWS
#endif

// Terminate on violation.
#if defined(GSL_TERMINATE_ON_CONTRACT_VIOLATION)
#if !gsl_CHECK_CFG_NO_VALUE_(GSL_TERMINATE_ON_CONTRACT_VIOLATION)
#pragma message("invalid configuration value GSL_TERMINATE_ON_CONTRACT_VIOLATION=" gsl_STRINGIFY( \
        GSL_TERMINATE_ON_CONTRACT_VIOLATION) "; macro must be defined without value")
#endif
#define gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES
#endif

// Unenforced contracts map to switching contract checking off.
#if defined(GSL_UNENFORCED_ON_CONTRACT_VIOLATION)
#if !gsl_CHECK_CFG_NO_VALUE_(GSL_UNENFORCED_ON_CONTRACT_VIOLATION)
#pragma message("invalid configuration value GSL_UNENFORCED_ON_CONTRACT_VIOLATION=" gsl_STRINGIFY( \
        GSL_UNENFORCED_ON_CONTRACT_VIOLATION) "; macro must be defined without value")
#endif
#define gsl_CONFIG_CONTRACT_CHECKING_OFF
#endif

// Configuration: Features

// Pattern used for every feature option below: a user-supplied value is
// validated (an invalid one only triggers a compile-time message), otherwise
// the default is defined. Each option also gets a function-like companion
// NAME_() that expands to the option's value.

// The three *_TO_STD options take a language-standard number; the default 99
// is larger than every accepted standard value.
#if defined(gsl_FEATURE_WITH_CONTAINER_TO_STD)
#if !gsl_CHECK_CFG_STD_VALUE_(gsl_FEATURE_WITH_CONTAINER_TO_STD)
#pragma message("invalid configuration value gsl_FEATURE_WITH_CONTAINER_TO_STD=" gsl_STRINGIFY( \
        gsl_FEATURE_WITH_CONTAINER_TO_STD) ", must be 98, 3, 11, 14, 17, or 20")
#endif
#else
#define gsl_FEATURE_WITH_CONTAINER_TO_STD 99  // default
#endif
#define gsl_FEATURE_WITH_CONTAINER_TO_STD_() gsl_FEATURE_WITH_CONTAINER_TO_STD

#if defined(gsl_FEATURE_MAKE_SPAN_TO_STD)
#if !gsl_CHECK_CFG_STD_VALUE_(gsl_FEATURE_MAKE_SPAN_TO_STD)
#pragma message("invalid configuration value gsl_FEATURE_MAKE_SPAN_TO_STD=" gsl_STRINGIFY( \
        gsl_FEATURE_MAKE_SPAN_TO_STD) ", must be 98, 3, 11, 14, 17, or 20")
#endif
#else
#define gsl_FEATURE_MAKE_SPAN_TO_STD 99  // default
#endif
#define gsl_FEATURE_MAKE_SPAN_TO_STD_() gsl_FEATURE_MAKE_SPAN_TO_STD

#if defined(gsl_FEATURE_BYTE_SPAN_TO_STD)
#if !gsl_CHECK_CFG_STD_VALUE_(gsl_FEATURE_BYTE_SPAN_TO_STD)
#pragma message("invalid configuration value gsl_FEATURE_BYTE_SPAN_TO_STD=" gsl_STRINGIFY( \
        gsl_FEATURE_BYTE_SPAN_TO_STD) ", must be 98, 3, 11, 14, 17, or 20")
#endif
#else
#define gsl_FEATURE_BYTE_SPAN_TO_STD 99  // default
#endif
#define gsl_FEATURE_BYTE_SPAN_TO_STD_() gsl_FEATURE_BYTE_SPAN_TO_STD

// Toggle; off by default.
#if defined(gsl_FEATURE_IMPLICIT_MACRO)
#if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_FEATURE_IMPLICIT_MACRO)
#pragma message("invalid configuration value gsl_FEATURE_IMPLICIT_MACRO=" gsl_STRINGIFY( \
        gsl_FEATURE_IMPLICIT_MACRO) ", must be 0 or 1")
#endif
#else
#define gsl_FEATURE_IMPLICIT_MACRO 0  // default
#endif
#define gsl_FEATURE_IMPLICIT_MACRO_() gsl_FEATURE_IMPLICIT_MACRO

// Toggle; on by default only with defaults version 0.
#if defined(gsl_FEATURE_OWNER_MACRO)
#if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_FEATURE_OWNER_MACRO)
#pragma message("invalid configuration value gsl_FEATURE_OWNER_MACRO=" gsl_STRINGIFY( \
        gsl_FEATURE_OWNER_MACRO) ", must be 0 or 1")
#endif
#else
#define gsl_FEATURE_OWNER_MACRO (gsl_CONFIG_DEFAULTS_VERSION == 0)  // default
#endif
#define gsl_FEATURE_OWNER_MACRO_() gsl_FEATURE_OWNER_MACRO

// Toggle; off by default.
#if defined(gsl_FEATURE_EXPERIMENTAL_RETURN_GUARD)
#if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_FEATURE_EXPERIMENTAL_RETURN_GUARD)
#pragma message(                                                                            \
        "invalid configuration value gsl_FEATURE_EXPERIMENTAL_RETURN_GUARD=" gsl_STRINGIFY( \
                gsl_FEATURE_EXPERIMENTAL_RETURN_GUARD) ", must be 0 or 1")
#endif
#else
#define gsl_FEATURE_EXPERIMENTAL_RETURN_GUARD 0  // default
#endif
#define gsl_FEATURE_EXPERIMENTAL_RETURN_GUARD_() gsl_FEATURE_EXPERIMENTAL_RETURN_GUARD

// Toggle; on by default from defaults version 1.
#if defined(gsl_FEATURE_GSL_LITE_NAMESPACE)
#if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_FEATURE_GSL_LITE_NAMESPACE)
#pragma message("invalid configuration value gsl_FEATURE_GSL_LITE_NAMESPACE=" gsl_STRINGIFY( \
        gsl_FEATURE_GSL_LITE_NAMESPACE) ", must be 0 or 1")
#endif
#else
#define gsl_FEATURE_GSL_LITE_NAMESPACE (gsl_CONFIG_DEFAULTS_VERSION >= 1)  // default
#endif
#define gsl_FEATURE_GSL_LITE_NAMESPACE_() gsl_FEATURE_GSL_LITE_NAMESPACE

// Configuration: Other

// gsl_CONFIG_TRANSPARENT_NOT_NULL: default derived from the defaults version;
// a user-supplied value is validated and must not be combined with
// gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF.
#ifndef gsl_CONFIG_TRANSPARENT_NOT_NULL
# define gsl_CONFIG_TRANSPARENT_NOT_NULL (gsl_CONFIG_DEFAULTS_VERSION >= 1)  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_TRANSPARENT_NOT_NULL)
#  pragma message("invalid configuration value gsl_CONFIG_TRANSPARENT_NOT_NULL=" \
                  gsl_STRINGIFY(gsl_CONFIG_TRANSPARENT_NOT_NULL)                 \
                  ", must be 0 or 1")
# endif
# if gsl_CONFIG_TRANSPARENT_NOT_NULL && defined(gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF)
#  error configuration option gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF is meaningless if gsl_CONFIG_TRANSPARENT_NOT_NULL=1
# endif
#endif
#define gsl_CONFIG_TRANSPARENT_NOT_NULL_() gsl_CONFIG_TRANSPARENT_NOT_NULL

// Deprecation level: 6 for defaults version 1 and later, 0 otherwise.
#ifndef gsl_CONFIG_DEPRECATE_TO_LEVEL
# if gsl_CONFIG_DEFAULTS_VERSION < 1
#  define gsl_CONFIG_DEPRECATE_TO_LEVEL 0
# else
#  define gsl_CONFIG_DEPRECATE_TO_LEVEL 6
# endif
#endif

// Index type used by span.
#ifndef gsl_CONFIG_SPAN_INDEX_TYPE
# define gsl_CONFIG_SPAN_INDEX_TYPE std::size_t
#endif
#define gsl_CONFIG_SPAN_INDEX_TYPE_() gsl_CONFIG_SPAN_INDEX_TYPE

// General index type: std::ptrdiff_t (as in p0122r3) for defaults version 1
// and later, otherwise whatever the span index type is.
#ifndef gsl_CONFIG_INDEX_TYPE
# if gsl_CONFIG_DEFAULTS_VERSION < 1
#  define gsl_CONFIG_INDEX_TYPE gsl_CONFIG_SPAN_INDEX_TYPE
# else
#  define gsl_CONFIG_INDEX_TYPE std::ptrdiff_t
# endif
#endif
#define gsl_CONFIG_INDEX_TYPE_() gsl_CONFIG_INDEX_TYPE

// Boolean configuration toggles. For each one: install the default when the
// macro is not user-defined, otherwise validate that the value passes the
// toggle check; then define the function-like `..._()` accessor.

#ifndef gsl_CONFIG_NOT_NULL_EXPLICIT_CTOR
# define gsl_CONFIG_NOT_NULL_EXPLICIT_CTOR (gsl_CONFIG_DEFAULTS_VERSION >= 1)  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_NOT_NULL_EXPLICIT_CTOR)
#  pragma message("invalid configuration value gsl_CONFIG_NOT_NULL_EXPLICIT_CTOR=" \
                  gsl_STRINGIFY(gsl_CONFIG_NOT_NULL_EXPLICIT_CTOR)                 \
                  ", must be 0 or 1")
# endif
#endif
#define gsl_CONFIG_NOT_NULL_EXPLICIT_CTOR_() gsl_CONFIG_NOT_NULL_EXPLICIT_CTOR

#ifndef gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF
# define gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF 0  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF)
#  pragma message("invalid configuration value gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF=" \
                  gsl_STRINGIFY(gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF)                 \
                  ", must be 0 or 1")
# endif
#endif
#define gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF_() gsl_CONFIG_NOT_NULL_GET_BY_CONST_REF

#ifndef gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS
# define gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS 0  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS)
#  pragma message("invalid configuration value gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS)                 \
                  ", must be 0 or 1")
# endif
#endif
#define gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS_() gsl_CONFIG_CONFIRMS_COMPILATION_ERRORS

#ifndef gsl_CONFIG_ALLOWS_SPAN_COMPARISON
# define gsl_CONFIG_ALLOWS_SPAN_COMPARISON (gsl_CONFIG_DEFAULTS_VERSION == 0)  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_ALLOWS_SPAN_COMPARISON)
#  pragma message("invalid configuration value gsl_CONFIG_ALLOWS_SPAN_COMPARISON=" \
                  gsl_STRINGIFY(gsl_CONFIG_ALLOWS_SPAN_COMPARISON)                 \
                  ", must be 0 or 1")
# endif
#endif
#define gsl_CONFIG_ALLOWS_SPAN_COMPARISON_() gsl_CONFIG_ALLOWS_SPAN_COMPARISON

#ifndef gsl_CONFIG_ALLOWS_NONSTRICT_SPAN_COMPARISON
# define gsl_CONFIG_ALLOWS_NONSTRICT_SPAN_COMPARISON 1  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_ALLOWS_NONSTRICT_SPAN_COMPARISON)
#  pragma message("invalid configuration value gsl_CONFIG_ALLOWS_NONSTRICT_SPAN_COMPARISON=" \
                  gsl_STRINGIFY(gsl_CONFIG_ALLOWS_NONSTRICT_SPAN_COMPARISON)                 \
                  ", must be 0 or 1")
# endif
#endif
#define gsl_CONFIG_ALLOWS_NONSTRICT_SPAN_COMPARISON_() gsl_CONFIG_ALLOWS_NONSTRICT_SPAN_COMPARISON

#ifndef gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR
# define gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR 0  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR)
#  pragma message("invalid configuration value gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR=" \
                  gsl_STRINGIFY(gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR)                 \
                  ", must be 0 or 1")
# endif
#endif
#define gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR_() \
    gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR

#ifndef gsl_CONFIG_NARROW_THROWS_ON_TRUNCATION
# define gsl_CONFIG_NARROW_THROWS_ON_TRUNCATION (gsl_CONFIG_DEFAULTS_VERSION >= 1)  // default
#else
# if !gsl_CHECK_CFG_TOGGLE_VALUE_(gsl_CONFIG_NARROW_THROWS_ON_TRUNCATION)
#  pragma message("invalid configuration value gsl_CONFIG_NARROW_THROWS_ON_TRUNCATION=" \
                  gsl_STRINGIFY(gsl_CONFIG_NARROW_THROWS_ON_TRUNCATION)                 \
                  ", must be 0 or 1")
# endif
#endif
#define gsl_CONFIG_NARROW_THROWS_ON_TRUNCATION_() gsl_CONFIG_NARROW_THROWS_ON_TRUNCATION

// The contract-related configuration macros are pure flags: they must be
// defined without a value. For every flag the user has defined, emit a
// diagnostic message if the no-value check rejects it.

// Contract checking selection.
#ifdef gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_CHECKING_AUDIT
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_CHECKING_AUDIT)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_CHECKING_AUDIT=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_CHECKING_AUDIT)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_CHECKING_ON
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_CHECKING_ON)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_CHECKING_ON=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_CHECKING_ON)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_CHECKING_OFF
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_CHECKING_OFF)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_CHECKING_OFF=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_CHECKING_OFF)                 \
                  "; macro must be defined without value")
# endif
#endif

// Contract violation handling selection.
#ifdef gsl_CONFIG_CONTRACT_VIOLATION_THROWS
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_VIOLATION_THROWS)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_VIOLATION_THROWS=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_VIOLATION_THROWS)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_VIOLATION_TRAPS
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_VIOLATION_TRAPS)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_VIOLATION_TRAPS=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_VIOLATION_TRAPS)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER)
#  pragma message("invalid configuration value gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER=" \
                  gsl_STRINGIFY(gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER)                 \
                  "; macro must be defined without value")
# endif
#endif

// Treatment of unenforced contracts.
#ifdef gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME)
#  pragma message("invalid configuration value gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME=" \
                  gsl_STRINGIFY(gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME)                 \
                  "; macro must be defined without value")
# endif
#endif
#ifdef gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE
# if !gsl_CHECK_CFG_NO_VALUE_(gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE)
#  pragma message("invalid configuration value gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE=" \
                  gsl_STRINGIFY(gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE)                 \
                  "; macro must be defined without value")
# endif
#endif

// Within each group of contract options at most one may be selected.
#if (defined(gsl_CONFIG_CONTRACT_CHECKING_AUDIT) + defined(gsl_CONFIG_CONTRACT_CHECKING_ON) + \
     defined(gsl_CONFIG_CONTRACT_CHECKING_OFF)) > 1
# error only one of gsl_CONFIG_CONTRACT_CHECKING_AUDIT, gsl_CONFIG_CONTRACT_CHECKING_ON, and gsl_CONFIG_CONTRACT_CHECKING_OFF may be defined
#endif
#if (defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS) +     \
     defined(gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES) + \
     defined(gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS) +    \
     defined(gsl_CONFIG_CONTRACT_VIOLATION_TRAPS) +      \
     defined(gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER)) > 1
# error only one of gsl_CONFIG_CONTRACT_VIOLATION_THROWS, gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES, gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS, gsl_CONFIG_CONTRACT_VIOLATION_TRAPS, and gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER may be defined
#endif
#if (defined(gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME) + \
     defined(gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE)) > 1
# error only one of gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME and gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE may be defined
#endif

// When no option of a group was selected, pick the default for that group.
#if !defined(gsl_CONFIG_CONTRACT_CHECKING_AUDIT) && !defined(gsl_CONFIG_CONTRACT_CHECKING_ON) && \
        !defined(gsl_CONFIG_CONTRACT_CHECKING_OFF)
# define gsl_CONFIG_CONTRACT_CHECKING_ON  // default: contract checking enabled
#endif
#if !defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS) &&         \
        !defined(gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES) && \
        !defined(gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS) &&    \
        !defined(gsl_CONFIG_CONTRACT_VIOLATION_TRAPS) &&      \
        !defined(gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER)
# define gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES  // default
#endif
#if !defined(gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME) && \
        !defined(gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE)
# define gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE  // default
#endif

// C++ language version detection (C++20 is speculative):
// Note: VC14.0/1900 (VS2015) lacks too much from C++14.

// Language version in use. With MSVC (but not clang-cl) _MSVC_LANG is
// consulted instead of __cplusplus, and _MSC_VER 1900 is pinned to C++11.
// The user may predefine gsl_CPLUSPLUS to override the detection.
#if !defined(gsl_CPLUSPLUS)
# if !defined(_MSVC_LANG) || defined(__clang__)
#  define gsl_CPLUSPLUS __cplusplus
# else
#  define gsl_CPLUSPLUS (_MSC_VER == 1900 ? 201103L : _MSVC_LANG)
# endif
#endif

// C++ standard library version; follows the language version unless the user
// predefines it.
#if !defined(gsl_CPLUSPLUS_STDLIB)
# define gsl_CPLUSPLUS_STDLIB gsl_CPLUSPLUS
#endif

// Language-level thresholds.
#define gsl_CPP98_OR_GREATER (gsl_CPLUSPLUS >= 199711L)
#define gsl_CPP11_OR_GREATER (gsl_CPLUSPLUS >= 201103L)
#define gsl_CPP14_OR_GREATER (gsl_CPLUSPLUS >= 201402L)
#define gsl_CPP17_OR_GREATER (gsl_CPLUSPLUS >= 201703L)
#define gsl_CPP20_OR_GREATER (gsl_CPLUSPLUS >= 202000L)

// Short language version number, e.g. 201103L -> 11 and 201703L -> 17;
// C++98 (199711L) is represented as 3.
#define gsl_CPLUSPLUS_V (gsl_CPLUSPLUS / 100 - (gsl_CPLUSPLUS > 200000 ? 2000 : 1994))

// Membership test for the half-open range [lo..hi).
#define gsl_BETWEEN(v, lo, hi) ((lo) <= (v) && (v) < (hi))

// Compiler versions:

// clang-format off
// MSVC++  6.0  _MSC_VER == 1200  gsl_COMPILER_MSVC_VERSION ==  60  (Visual Studio 6.0)
// MSVC++  7.0  _MSC_VER == 1300  gsl_COMPILER_MSVC_VERSION ==  70  (Visual Studio .NET 2002)
// MSVC++  7.1  _MSC_VER == 1310  gsl_COMPILER_MSVC_VERSION ==  71  (Visual Studio .NET 2003)
// MSVC++  8.0  _MSC_VER == 1400  gsl_COMPILER_MSVC_VERSION ==  80  (Visual Studio 2005)
// MSVC++  9.0  _MSC_VER == 1500  gsl_COMPILER_MSVC_VERSION ==  90  (Visual Studio 2008)
// MSVC++ 10.0  _MSC_VER == 1600  gsl_COMPILER_MSVC_VERSION == 100  (Visual Studio 2010)
// MSVC++ 11.0  _MSC_VER == 1700  gsl_COMPILER_MSVC_VERSION == 110  (Visual Studio 2012)
// MSVC++ 12.0  _MSC_VER == 1800  gsl_COMPILER_MSVC_VERSION == 120  (Visual Studio 2013)
// MSVC++ 14.0  _MSC_VER == 1900  gsl_COMPILER_MSVC_VERSION == 140  (Visual Studio 2015)
// MSVC++ 14.1  _MSC_VER >= 1910  gsl_COMPILER_MSVC_VERSION == 141  (Visual Studio 2017)
// MSVC++ 14.2  _MSC_VER >= 1920  gsl_COMPILER_MSVC_VERSION == 142  (Visual Studio 2019)
// clang-format on

// MSVC version macros; all zero for any other compiler, including Clang
// front ends that define _MSC_VER.
//   gsl_COMPILER_MSVC_VER          _MSC_VER itself
//   gsl_COMPILER_MSVC_VERSION      toolset version, e.g. 1900 -> 140, 1800 -> 120
//   gsl_COMPILER_MSVC_VERSION_FULL same scheme at full _MSC_VER resolution
#if !defined(_MSC_VER) || defined(__clang__)
# define gsl_COMPILER_MSVC_VER 0
# define gsl_COMPILER_MSVC_VERSION 0
# define gsl_COMPILER_MSVC_VERSION_FULL 0
#else
# define gsl_COMPILER_MSVC_VER (_MSC_VER)
# define gsl_COMPILER_MSVC_VERSION (_MSC_VER / 10 - 10 * (5 + (_MSC_VER < 1900)))
# define gsl_COMPILER_MSVC_VERSION_FULL (_MSC_VER - 100 * (5 + (_MSC_VER < 1900)))
#endif

// Packs a major.minor.patch triple into one number, e.g. (4, 8, 1) -> 481.
#define gsl_COMPILER_VERSION(major, minor, patch) (100 * (major) + 10 * (minor) + (patch))

// clang-format off
// AppleClang  7.0.0  __apple_build_version__ ==  7000172  gsl_COMPILER_APPLECLANG_VERSION ==  700  (Xcode 7.0, 7.0.1)               (LLVM  3.7.0)
// AppleClang  7.0.0  __apple_build_version__ ==  7000176  gsl_COMPILER_APPLECLANG_VERSION ==  700  (Xcode 7.1)                      (LLVM  3.7.0)
// AppleClang  7.0.2  __apple_build_version__ ==  7000181  gsl_COMPILER_APPLECLANG_VERSION ==  702  (Xcode 7.2, 7.2.1)               (LLVM  3.7.0)
// AppleClang  7.3.0  __apple_build_version__ ==  7030029  gsl_COMPILER_APPLECLANG_VERSION ==  730  (Xcode 7.3)                      (LLVM  3.8.0)
// AppleClang  7.3.0  __apple_build_version__ ==  7030031  gsl_COMPILER_APPLECLANG_VERSION ==  730  (Xcode 7.3.1)                    (LLVM  3.8.0)
// AppleClang  8.0.0  __apple_build_version__ ==  8000038  gsl_COMPILER_APPLECLANG_VERSION ==  800  (Xcode 8.0)                      (LLVM  3.9.0)
// AppleClang  8.0.0  __apple_build_version__ ==  8000042  gsl_COMPILER_APPLECLANG_VERSION ==  800  (Xcode 8.1, 8.2, 8.2.1)          (LLVM  3.9.0)
// AppleClang  8.1.0  __apple_build_version__ ==  8020038  gsl_COMPILER_APPLECLANG_VERSION ==  810  (Xcode 8.3)                      (LLVM  3.9.0)
// AppleClang  8.1.0  __apple_build_version__ ==  8020041  gsl_COMPILER_APPLECLANG_VERSION ==  810  (Xcode 8.3.1)                    (LLVM  3.9.0)
// AppleClang  8.1.0  __apple_build_version__ ==  8020042  gsl_COMPILER_APPLECLANG_VERSION ==  810  (Xcode 8.3.2, 8.3.3)             (LLVM  3.9.0)
// AppleClang  9.0.0  __apple_build_version__ ==  9000037  gsl_COMPILER_APPLECLANG_VERSION ==  900  (Xcode 9.0)                      (LLVM  4.0.0)
// AppleClang  9.0.0  __apple_build_version__ ==  9000038  gsl_COMPILER_APPLECLANG_VERSION ==  900  (Xcode 9.1)                      (LLVM  4.0.0)
// AppleClang  9.0.0  __apple_build_version__ ==  9000039  gsl_COMPILER_APPLECLANG_VERSION ==  900  (Xcode 9.2)                      (LLVM  4.0.0)
// AppleClang  9.1.0  __apple_build_version__ ==  9020039  gsl_COMPILER_APPLECLANG_VERSION ==  910  (Xcode 9.3, 9.3.1)               (LLVM  5.0.2)
// AppleClang  9.1.0  __apple_build_version__ ==  9020039  gsl_COMPILER_APPLECLANG_VERSION ==  910  (Xcode 9.4, 9.4.1)               (LLVM  5.0.2)
// AppleClang 10.0.0  __apple_build_version__ == 10001145  gsl_COMPILER_APPLECLANG_VERSION == 1000  (Xcode 10.0, 10.1)               (LLVM  6.0.1)
// AppleClang 10.0.1  __apple_build_version__ == 10010046  gsl_COMPILER_APPLECLANG_VERSION == 1001  (Xcode 10.2, 10.2.1, 10.3)       (LLVM  7.0.0)
// AppleClang 11.0.0  __apple_build_version__ == 11000033  gsl_COMPILER_APPLECLANG_VERSION == 1100  (Xcode 11.1, 11.2, 11.3, 11.3.1) (LLVM  8.0.0)
// AppleClang 11.0.3  __apple_build_version__ == 11030032  gsl_COMPILER_APPLECLANG_VERSION == 1103  (Xcode 11.4, 11.4.1, 11.5, 11.6) (LLVM  9.0.0)
// AppleClang 12.0.0  __apple_build_version__ == 12000032  gsl_COMPILER_APPLECLANG_VERSION == 1200  (Xcode 12.0–12.4)                (LLVM 10.0.0)
// AppleClang 12.0.5  __apple_build_version__ == 12050022  gsl_COMPILER_APPLECLANG_VERSION == 1205  (Xcode 12.5)                     (LLVM 10.0.0)
// clang-format on

// Clang family: exactly one of the two macros is nonzero, depending on
// whether the Apple build marker is present; both are zero elsewhere.
#if !defined(__apple_build_version__) && !defined(__clang__)
# define gsl_COMPILER_APPLECLANG_VERSION 0
# define gsl_COMPILER_CLANG_VERSION 0
#elif defined(__apple_build_version__)
# define gsl_COMPILER_APPLECLANG_VERSION \
     gsl_COMPILER_VERSION(__clang_major__, __clang_minor__, __clang_patchlevel__)
# define gsl_COMPILER_CLANG_VERSION 0
#else
# define gsl_COMPILER_APPLECLANG_VERSION 0
# define gsl_COMPILER_CLANG_VERSION \
     gsl_COMPILER_VERSION(__clang_major__, __clang_minor__, __clang_patchlevel__)
#endif

// GCC proper; Clang also defines __GNUC__ and is therefore excluded.
#if !defined(__GNUC__) || defined(__clang__)
# define gsl_COMPILER_GNUC_VERSION 0
#else
# define gsl_COMPILER_GNUC_VERSION \
     gsl_COMPILER_VERSION(__GNUC__, __GNUC_MINOR__, __GNUC_PATCHLEVEL__)
#endif

// NVIDIA CUDA compiler: major * 10 + minor.
#ifndef __NVCC__
# define gsl_COMPILER_NVCC_VERSION 0
#else
# define gsl_COMPILER_NVCC_VERSION (__CUDACC_VER_MAJOR__ * 10 + __CUDACC_VER_MINOR__)
#endif

// ARM compiler: the short form drops the last four digits of __ARMCC_VERSION.
#ifndef __ARMCC_VERSION
# define gsl_COMPILER_ARMCC_VERSION 0
# define gsl_COMPILER_ARMCC_VERSION_FULL 0
#else
# define gsl_COMPILER_ARMCC_VERSION (__ARMCC_VERSION / 10000)
# define gsl_COMPILER_ARMCC_VERSION_FULL __ARMCC_VERSION
#endif

// Compiler non-strict aliasing:

// Attribute that exempts a type from strict-aliasing assumptions; expands to
// nothing on compilers other than GCC and Clang.
#if !defined(__GNUC__) && !defined(__clang__)
# define gsl_may_alias
#else
# define gsl_may_alias __attribute__((__may_alias__))
#endif

// Presence of gsl, language and library features:

// gsl_IN_STD(v): nonzero when the configured version `v` (with 98 mapped to 3,
// matching the encoding of gsl_CPLUSPLUS_V) is greater than or equal to the
// language version currently in use.
#define gsl_IN_STD(v) (((v) == 98 ? 3 : (v)) >= gsl_CPLUSPLUS_V)

// gsl_DEPRECATE_TO_LEVEL(level): nonzero when `level` does not exceed the
// configured gsl_CONFIG_DEPRECATE_TO_LEVEL. The argument is parenthesized so
// that expressions binding less tightly than `<=` (e.g. a conditional
// expression) are compared as a whole.
#define gsl_DEPRECATE_TO_LEVEL(level) ((level) <= gsl_CONFIG_DEPRECATE_TO_LEVEL)

// gsl_FEATURE_TO_STD(feature): applies gsl_IN_STD to gsl_FEATURE_<feature>_TO_STD.
#define gsl_FEATURE_TO_STD(feature) gsl_IN_STD(gsl_FEATURE(feature##_TO_STD))

// Lookup helpers: token-paste the name of the function-like accessor
// (gsl_FEATURE_<x>_, gsl_CONFIG_<x>_, gsl_HAVE_<x>_) and hand it to
// gsl_EVALF_, which is defined elsewhere in this header (presumably it
// invokes the accessor; confirm at its definition).
#define gsl_FEATURE(feature) gsl_EVALF_(gsl_FEATURE_##feature##_)
#define gsl_CONFIG(feature) gsl_EVALF_(gsl_CONFIG_##feature##_)
#define gsl_HAVE(feature) gsl_EVALF_(gsl_HAVE_##feature##_)

// Presence of wide character support:

// Wide character support is reported as present everywhere except under DJGPP.
#ifndef __DJGPP__
# define gsl_HAVE_WCHAR 1
#else
# define gsl_HAVE_WCHAR 0
#endif
#define gsl_HAVE_WCHAR_() gsl_HAVE_WCHAR

// Presence of language & library features:

// Detect whether C++ exceptions are enabled. Each compiler family advertises
// this differently, so the check is selected per family.
#if gsl_COMPILER_CLANG_VERSION || gsl_COMPILER_APPLECLANG_VERSION
# if defined(__OBJC__)
// There are a bunch of inconsistencies about __EXCEPTIONS and
// __has_feature(cxx_exceptions) in Clang 3.4/3.5/3.6. We're interested in C++
// exceptions, which can be checked by __has_feature(cxx_exceptions) in 3.5+. In
// pre-3.5, __has_feature(cxx_exceptions) can be true if ObjC exceptions are
// enabled, but C++ exceptions are disabled. The recommended way to check is
// `__EXCEPTIONS && __has_feature(cxx_exceptions)`. See
// https://releases.llvm.org/3.6.0/tools/clang/docs/ReleaseNotes.html#the-exceptions-macro
// Note: this is only relevant in Objective-C++, hence the __OBJC__ test.
#  if __EXCEPTIONS && __has_feature(cxx_exceptions)
#   define gsl_HAVE_EXCEPTIONS 1
#  else
#   define gsl_HAVE_EXCEPTIONS 0
#  endif
# else
// clang-cl doesn't define __EXCEPTIONS for MSVC compatibility (see
// https://reviews.llvm.org/D4065). Neither does Clang in MS-compatibility mode.
// Let's hope no one tries to build Objective-C++ code using MS-compatibility
// mode or clang-cl.
#  if __has_feature(cxx_exceptions)
#   define gsl_HAVE_EXCEPTIONS 1
#  else
#   define gsl_HAVE_EXCEPTIONS 0
#  endif
# endif
#elif gsl_COMPILER_GNUC_VERSION
// GCC before version 5 is checked via __EXCEPTIONS, later versions via the
// feature-test macro __cpp_exceptions.
# if gsl_BETWEEN(gsl_COMPILER_GNUC_VERSION, 1, 500)
#  if defined(__EXCEPTIONS)
#   define gsl_HAVE_EXCEPTIONS 1
#  else
#   define gsl_HAVE_EXCEPTIONS 0
#  endif
# else
#  if defined(__cpp_exceptions)
#   define gsl_HAVE_EXCEPTIONS 1
#  else
#   define gsl_HAVE_EXCEPTIONS 0
#  endif
# endif
#elif gsl_COMPILER_MSVC_VERSION
# if defined(_CPPUNWIND)
#  define gsl_HAVE_EXCEPTIONS 1
# else
#  define gsl_HAVE_EXCEPTIONS 0
# endif
#else
// For all other compilers, assume exceptions are always enabled.
# define gsl_HAVE_EXCEPTIONS 1
#endif
#define gsl_HAVE_EXCEPTIONS_() gsl_HAVE_EXCEPTIONS

// Throwing on contract violation is impossible without exception support.
#if defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS) && !gsl_HAVE_EXCEPTIONS
# error Cannot use gsl_CONFIG_CONTRACT_VIOLATION_THROWS if exceptions are disabled.
#endif  // gsl_CONFIG_CONTRACT_VIOLATION_THROWS without exception support

// Mirror of _HAS_CPP0X, or 0 when that macro is not defined.
#ifndef _HAS_CPP0X
# define gsl_HAS_CPP0X 0
#else
# define gsl_HAS_CPP0X _HAS_CPP0X
#endif

// gsl_CPPxx_yyy: true when the language level is at least C++xx, or when
// compiling with MSVC whose _MSC_VER is at least the threshold listed here
// (the `000` variants have no MSVC exception).
#define gsl_CPP11_100 (gsl_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1600)
#define gsl_CPP11_110 (gsl_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1700)
#define gsl_CPP11_120 (gsl_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1800)
#define gsl_CPP11_140 (gsl_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1900)

#define gsl_CPP14_000 (gsl_CPP14_OR_GREATER)
#define gsl_CPP14_120 (gsl_CPP14_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1800)
#define gsl_CPP14_140 (gsl_CPP14_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1900)

#define gsl_CPP17_000 (gsl_CPP17_OR_GREATER)
#define gsl_CPP17_140 (gsl_CPP17_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1900)

// As gsl_CPP11_140, but additionally satisfied by an older MSVC
// (_MSC_VER >= 1500 resp. 1600) when gsl_HAS_CPP0X is nonzero.
#define gsl_CPP11_140_CPP0X_90 (gsl_CPP11_140 || (gsl_COMPILER_MSVC_VER >= 1500 && gsl_HAS_CPP0X))
#define gsl_CPP11_140_CPP0X_100 (gsl_CPP11_140 || (gsl_COMPILER_MSVC_VER >= 1600 && gsl_HAS_CPP0X))

// Presence of C++11 language features:

// Each C++11 language feature flag is followed directly by its function-like
// accessor, which is the form queried through gsl_HAVE().

#define gsl_HAVE_C99_PREPROCESSOR gsl_CPP11_140
#define gsl_HAVE_C99_PREPROCESSOR_() gsl_HAVE_C99_PREPROCESSOR

#define gsl_HAVE_AUTO gsl_CPP11_100
#define gsl_HAVE_AUTO_() gsl_HAVE_AUTO

#define gsl_HAVE_RVALUE_REFERENCE gsl_CPP11_100
#define gsl_HAVE_RVALUE_REFERENCE_() gsl_HAVE_RVALUE_REFERENCE

// Reported as unavailable for GCC versions before 4.8.1.
#define gsl_HAVE_FUNCTION_REF_QUALIFIER \
    (gsl_CPP11_140 && !gsl_BETWEEN(gsl_COMPILER_GNUC_VERSION, 1, 481))
#define gsl_HAVE_FUNCTION_REF_QUALIFIER_() gsl_HAVE_FUNCTION_REF_QUALIFIER

#define gsl_HAVE_ENUM_CLASS gsl_CPP11_110
#define gsl_HAVE_ENUM_CLASS_() gsl_HAVE_ENUM_CLASS

#define gsl_HAVE_ALIAS_TEMPLATE gsl_CPP11_120
#define gsl_HAVE_ALIAS_TEMPLATE_() gsl_HAVE_ALIAS_TEMPLATE

#define gsl_HAVE_DEFAULT_FUNCTION_TEMPLATE_ARG gsl_CPP11_120
#define gsl_HAVE_DEFAULT_FUNCTION_TEMPLATE_ARG_() gsl_HAVE_DEFAULT_FUNCTION_TEMPLATE_ARG

#define gsl_HAVE_EXPLICIT gsl_CPP11_120
#define gsl_HAVE_EXPLICIT_() gsl_HAVE_EXPLICIT

#define gsl_HAVE_VARIADIC_TEMPLATE gsl_CPP11_120
#define gsl_HAVE_VARIADIC_TEMPLATE_() gsl_HAVE_VARIADIC_TEMPLATE

#define gsl_HAVE_IS_DELETE gsl_CPP11_120
#define gsl_HAVE_IS_DELETE_() gsl_HAVE_IS_DELETE

#define gsl_HAVE_CONSTEXPR_11 gsl_CPP11_140
#define gsl_HAVE_CONSTEXPR_11_() gsl_HAVE_CONSTEXPR_11

#define gsl_HAVE_IS_DEFAULT gsl_CPP11_140
#define gsl_HAVE_IS_DEFAULT_() gsl_HAVE_IS_DEFAULT

#define gsl_HAVE_NOEXCEPT gsl_CPP11_140
#define gsl_HAVE_NOEXCEPT_() gsl_HAVE_NOEXCEPT

// Reported as unavailable for GCC versions before 4.8.0.
#define gsl_HAVE_NORETURN (gsl_CPP11_140 && !gsl_BETWEEN(gsl_COMPILER_GNUC_VERSION, 1, 480))
#define gsl_HAVE_NORETURN_() gsl_HAVE_NORETURN

#define gsl_HAVE_EXPRESSION_SFINAE gsl_CPP11_140
#define gsl_HAVE_EXPRESSION_SFINAE_() gsl_HAVE_EXPRESSION_SFINAE

#define gsl_HAVE_OVERRIDE_FINAL gsl_CPP11_110
#define gsl_HAVE_OVERRIDE_FINAL_() gsl_HAVE_OVERRIDE_FINAL

// Presence of C++14 language features:

// C++14. Each flag is followed directly by its gsl_HAVE() accessor.

// Reported as unavailable for GCC versions before 6.0.0.
#define gsl_HAVE_CONSTEXPR_14 (gsl_CPP14_000 && !gsl_BETWEEN(gsl_COMPILER_GNUC_VERSION, 1, 600))
#define gsl_HAVE_CONSTEXPR_14_() gsl_HAVE_CONSTEXPR_14

#define gsl_HAVE_DECLTYPE_AUTO gsl_CPP14_140
#define gsl_HAVE_DECLTYPE_AUTO_() gsl_HAVE_DECLTYPE_AUTO

// Reported as unavailable for MSVC toolsets before 14.2.
#define gsl_HAVE_DEPRECATED (gsl_CPP14_140 && !gsl_BETWEEN(gsl_COMPILER_MSVC_VERSION, 1, 142))
#define gsl_HAVE_DEPRECATED_() gsl_HAVE_DEPRECATED

// Presence of C++17 language features:
// MSVC: template parameter deduction guides since Visual Studio 2017 v15.7

#define gsl_HAVE_ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE gsl_CPP17_000
#define gsl_HAVE_ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE_() \
    gsl_HAVE_ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE

#define gsl_HAVE_DEDUCTION_GUIDES \
    (gsl_CPP17_000 && !gsl_BETWEEN(gsl_COMPILER_MSVC_VERSION_FULL, 1, 1414))
#define gsl_HAVE_DEDUCTION_GUIDES_() gsl_HAVE_DEDUCTION_GUIDES

#define gsl_HAVE_NODISCARD gsl_CPP17_000
#define gsl_HAVE_NODISCARD_() gsl_HAVE_NODISCARD

#define gsl_HAVE_CONSTEXPR_17 gsl_CPP17_OR_GREATER
#define gsl_HAVE_CONSTEXPR_17_() gsl_HAVE_CONSTEXPR_17

// Presence of C++20 language features:

#define gsl_HAVE_CONSTEXPR_20 gsl_CPP20_OR_GREATER
#define gsl_HAVE_CONSTEXPR_20_() gsl_HAVE_CONSTEXPR_20

// Presence of C++ library features:

// Standard library level. It normally tracks the language level; the one
// exception is the ARM compiler before version 6.
#define gsl_STDLIB_CPP98_OR_GREATER gsl_CPP98_OR_GREATER
#if !gsl_BETWEEN(gsl_COMPILER_ARMCC_VERSION, 1, 600)
# define gsl_STDLIB_CPP11_OR_GREATER gsl_CPP11_OR_GREATER
# define gsl_STDLIB_CPP14_OR_GREATER gsl_CPP14_OR_GREATER
# define gsl_STDLIB_CPP17_OR_GREATER gsl_CPP17_OR_GREATER
# define gsl_STDLIB_CPP20_OR_GREATER gsl_CPP20_OR_GREATER
#else
// Some versions of the ARM compiler apparently ship without a C++11 standard
// library despite having some C++11 support.
# define gsl_STDLIB_CPP11_OR_GREATER 0
# define gsl_STDLIB_CPP14_OR_GREATER 0
# define gsl_STDLIB_CPP17_OR_GREATER 0
# define gsl_STDLIB_CPP20_OR_GREATER 0
#endif

// gsl_STDLIB_CPPxx_yyy: true when the library level is at least C++xx, or when
// compiling with MSVC whose _MSC_VER is at least the threshold listed here
// (the `000` variants have no MSVC exception).
#define gsl_STDLIB_CPP11_100 (gsl_STDLIB_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1600)
#define gsl_STDLIB_CPP11_110 (gsl_STDLIB_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1700)
#define gsl_STDLIB_CPP11_120 (gsl_STDLIB_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1800)
#define gsl_STDLIB_CPP11_140 (gsl_STDLIB_CPP11_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1900)

#define gsl_STDLIB_CPP14_000 (gsl_STDLIB_CPP14_OR_GREATER)
#define gsl_STDLIB_CPP14_120 (gsl_STDLIB_CPP14_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1800)
#define gsl_STDLIB_CPP14_140 (gsl_STDLIB_CPP14_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1900)

#define gsl_STDLIB_CPP17_000 (gsl_STDLIB_CPP17_OR_GREATER)
#define gsl_STDLIB_CPP17_140 (gsl_STDLIB_CPP17_OR_GREATER || gsl_COMPILER_MSVC_VER >= 1900)

// As gsl_STDLIB_CPP11_140, but additionally satisfied by an older MSVC
// (_MSC_VER >= 1500 resp. 1600) when gsl_HAS_CPP0X is nonzero.
#define gsl_STDLIB_CPP11_140_CPP0X_90 \
    (gsl_STDLIB_CPP11_140 || (gsl_COMPILER_MSVC_VER >= 1500 && gsl_HAS_CPP0X))
#define gsl_STDLIB_CPP11_140_CPP0X_100 \
    (gsl_STDLIB_CPP11_140 || (gsl_COMPILER_MSVC_VER >= 1600 && gsl_HAS_CPP0X))

// Each library feature flag is followed directly by its function-like
// accessor, which is the form queried through gsl_HAVE().

#define gsl_HAVE_ADDRESSOF gsl_STDLIB_CPP17_000
#define gsl_HAVE_ADDRESSOF_() gsl_HAVE_ADDRESSOF

#define gsl_HAVE_ARRAY gsl_STDLIB_CPP11_110
#define gsl_HAVE_ARRAY_() gsl_HAVE_ARRAY

#define gsl_HAVE_TYPE_TRAITS gsl_STDLIB_CPP11_110
#define gsl_HAVE_TYPE_TRAITS_() gsl_HAVE_TYPE_TRAITS

#define gsl_HAVE_TR1_TYPE_TRAITS gsl_STDLIB_CPP11_110
#define gsl_HAVE_TR1_TYPE_TRAITS_() gsl_HAVE_TR1_TYPE_TRAITS

#define gsl_HAVE_CONTAINER_DATA_METHOD gsl_STDLIB_CPP11_140_CPP0X_90
#define gsl_HAVE_CONTAINER_DATA_METHOD_() gsl_HAVE_CONTAINER_DATA_METHOD

#define gsl_HAVE_STD_DATA gsl_STDLIB_CPP17_000
#define gsl_HAVE_STD_DATA_() gsl_HAVE_STD_DATA

// std::ssize: trust the library feature-test macro when it is visible,
// otherwise fall back to a GCC 10+ / post-C++17 heuristic.
#if defined(__cpp_lib_ssize)
# define gsl_HAVE_STD_SSIZE 1
#else
# define gsl_HAVE_STD_SSIZE (gsl_COMPILER_GNUC_VERSION >= 1000 && __cplusplus > 201703L)
#endif
#define gsl_HAVE_STD_SSIZE_() gsl_HAVE_STD_SSIZE

#define gsl_HAVE_HASH gsl_STDLIB_CPP11_120
#define gsl_HAVE_HASH_() gsl_HAVE_HASH

#define gsl_HAVE_SIZED_TYPES gsl_STDLIB_CPP11_140
#define gsl_HAVE_SIZED_TYPES_() gsl_HAVE_SIZED_TYPES

#define gsl_HAVE_MAKE_SHARED gsl_STDLIB_CPP11_140_CPP0X_100
#define gsl_HAVE_MAKE_SHARED_() gsl_HAVE_MAKE_SHARED

#define gsl_HAVE_SHARED_PTR gsl_STDLIB_CPP11_140_CPP0X_100
#define gsl_HAVE_SHARED_PTR_() gsl_HAVE_SHARED_PTR

#define gsl_HAVE_UNIQUE_PTR gsl_STDLIB_CPP11_140_CPP0X_100
#define gsl_HAVE_UNIQUE_PTR_() gsl_HAVE_UNIQUE_PTR

#define gsl_HAVE_MAKE_UNIQUE gsl_STDLIB_CPP14_120
#define gsl_HAVE_MAKE_UNIQUE_() gsl_HAVE_MAKE_UNIQUE

#define gsl_HAVE_MOVE_FORWARD gsl_STDLIB_CPP11_100
#define gsl_HAVE_MOVE_FORWARD_() gsl_HAVE_MOVE_FORWARD

// nullptr is a language feature but needs library support, so it is listed
// as a library feature.
#define gsl_HAVE_NULLPTR gsl_STDLIB_CPP11_100
#define gsl_HAVE_NULLPTR_() gsl_HAVE_NULLPTR

#define gsl_HAVE_UNCAUGHT_EXCEPTIONS gsl_STDLIB_CPP17_140
#define gsl_HAVE_UNCAUGHT_EXCEPTIONS_() gsl_HAVE_UNCAUGHT_EXCEPTIONS

#define gsl_HAVE_ADD_CONST gsl_HAVE_TYPE_TRAITS
#define gsl_HAVE_ADD_CONST_() gsl_HAVE_ADD_CONST

// Initializer lists are a language feature but need library support, so they
// are listed as a library feature.
#define gsl_HAVE_INITIALIZER_LIST gsl_STDLIB_CPP11_120
#define gsl_HAVE_INITIALIZER_LIST_() gsl_HAVE_INITIALIZER_LIST

#define gsl_HAVE_INTEGRAL_CONSTANT gsl_HAVE_TYPE_TRAITS
#define gsl_HAVE_INTEGRAL_CONSTANT_() gsl_HAVE_INTEGRAL_CONSTANT

#define gsl_HAVE_REMOVE_CONST gsl_HAVE_TYPE_TRAITS
#define gsl_HAVE_REMOVE_CONST_() gsl_HAVE_REMOVE_CONST

#define gsl_HAVE_REMOVE_REFERENCE gsl_HAVE_TYPE_TRAITS
#define gsl_HAVE_REMOVE_REFERENCE_() gsl_HAVE_REMOVE_REFERENCE

#define gsl_HAVE_REMOVE_CVREF gsl_STDLIB_CPP20_OR_GREATER
#define gsl_HAVE_REMOVE_CVREF_() gsl_HAVE_REMOVE_CVREF

#define gsl_HAVE_TR1_ADD_CONST gsl_HAVE_TR1_TYPE_TRAITS
#define gsl_HAVE_TR1_ADD_CONST_() gsl_HAVE_TR1_ADD_CONST

#define gsl_HAVE_TR1_INTEGRAL_CONSTANT gsl_HAVE_TR1_TYPE_TRAITS
#define gsl_HAVE_TR1_INTEGRAL_CONSTANT_() gsl_HAVE_TR1_INTEGRAL_CONSTANT

#define gsl_HAVE_TR1_REMOVE_CONST gsl_HAVE_TR1_TYPE_TRAITS
#define gsl_HAVE_TR1_REMOVE_CONST_() gsl_HAVE_TR1_REMOVE_CONST

#define gsl_HAVE_TR1_REMOVE_REFERENCE gsl_HAVE_TR1_TYPE_TRAITS
#define gsl_HAVE_TR1_REMOVE_REFERENCE_() gsl_HAVE_TR1_REMOVE_REFERENCE

// C++ feature usage:

// gsl_ADDRESSOF(x): address of `x`. Uses std::addressof when gsl_HAVE(ADDRESSOF)
// is set; otherwise falls back to the built-in address-of operator. The
// fallback parenthesizes its argument so that an expression argument (e.g. a
// conditional expression) has its address taken as a whole.
#if gsl_HAVE(ADDRESSOF)
#define gsl_ADDRESSOF(x) std::addressof(x)
#else
#define gsl_ADDRESSOF(x) (&(x))
#endif

// `gsl_constexpr`, `gsl_constexpr14`, `gsl_constexpr17`, `gsl_constexpr20`:
// each expands to `constexpr` when the matching `gsl_HAVE( CONSTEXPR_nn )` flag
// is set and to nothing (just a placeholder comment) otherwise, so a function
// can be declared constexpr only where the given language level permits it.
#if gsl_HAVE(CONSTEXPR_11)
#define gsl_constexpr constexpr
#else
#define gsl_constexpr /*constexpr*/
#endif

#if gsl_HAVE(CONSTEXPR_14)
#define gsl_constexpr14 constexpr
#else
#define gsl_constexpr14 /*constexpr*/
#endif

#if gsl_HAVE(CONSTEXPR_17)
#define gsl_constexpr17 constexpr
#else
#define gsl_constexpr17 /*constexpr*/
#endif

#if gsl_HAVE(CONSTEXPR_20)
#define gsl_constexpr20 constexpr
#else
#define gsl_constexpr20 /*constexpr*/
#endif

// `gsl_explicit`: expands to `explicit` when `gsl_HAVE( EXPLICIT )` is set,
// and to nothing otherwise.
#if gsl_HAVE(EXPLICIT)
#define gsl_explicit explicit
#else
#define gsl_explicit /*explicit*/
#endif

// Optional, unprefixed `implicit` marker macro; it always expands to nothing
// and is only defined when the IMPLICIT_MACRO feature is switched on.
#if gsl_FEATURE(IMPLICIT_MACRO)
#define implicit /*implicit*/
#endif

// Deleted-function emulation.
//
// `gsl_is_delete` is appended to a declaration to delete it, and
// `gsl_is_delete_access` names the access level under which such a declaration
// is placed. Without `= delete` support the declaration is left as-is and
// hidden under `private` instead.
#if !gsl_HAVE(IS_DELETE)
#define gsl_is_delete
#define gsl_is_delete_access private
#else
#define gsl_is_delete = delete
#define gsl_is_delete_access public
#endif

// `gsl_noexcept` / `gsl_noexcept_if( expr )`: map to `noexcept` and
// `noexcept( expr )` when available. The fallback uses the dynamic exception
// specification `throw()` for the unconditional form and drops the conditional
// form entirely.
#if gsl_HAVE(NOEXCEPT)
#define gsl_noexcept noexcept
#define gsl_noexcept_if(expr) noexcept(expr)
#else
#define gsl_noexcept throw()
#define gsl_noexcept_if(expr) /*noexcept( expr )*/
#endif
// `gsl_noexcept_not_testing`: same as `gsl_noexcept`, except that it expands
// to nothing when `gsl_TESTING_` is defined.
#if defined(gsl_TESTING_)
#define gsl_noexcept_not_testing
#else
#define gsl_noexcept_not_testing gsl_noexcept
#endif

// `gsl_nullptr`: the null pointer constant -- `nullptr` where available,
// the `NULL` macro otherwise.
#if gsl_HAVE(NULLPTR)
#define gsl_nullptr nullptr
#else
#define gsl_nullptr NULL
#endif

// `gsl_NODISCARD`: the `[[nodiscard]]` attribute where supported, nothing
// otherwise.
#if gsl_HAVE(NODISCARD)
#define gsl_NODISCARD [[nodiscard]]
#else
#define gsl_NODISCARD
#endif

// `gsl_NORETURN`: prefers the standard `[[noreturn]]` attribute, then falls
// back to the vendor spelling (`__declspec` when `_MSC_VER` is defined,
// `__attribute__` for GCC, Clang, Apple Clang and ARMCC), and finally to
// nothing for any other compiler.
#if gsl_HAVE(NORETURN)
#define gsl_NORETURN [[noreturn]]
#elif defined(_MSC_VER)
#define gsl_NORETURN __declspec(noreturn)
#elif gsl_COMPILER_GNUC_VERSION || gsl_COMPILER_CLANG_VERSION || \
        gsl_COMPILER_APPLECLANG_VERSION || gsl_COMPILER_ARMCC_VERSION
#define gsl_NORETURN __attribute__((noreturn))
#else
#define gsl_NORETURN
#endif

// `gsl_DEPRECATED` / `gsl_DEPRECATED_MSG( msg )`: the `[[deprecated]]`
// attribute, without and with a message. Both expand to nothing when the
// attribute is unavailable or when `gsl_TESTING_` is defined.
#if gsl_HAVE(DEPRECATED) && !defined(gsl_TESTING_)
#define gsl_DEPRECATED [[deprecated]]
#define gsl_DEPRECATED_MSG(msg) [[deprecated(msg)]]
#else
#define gsl_DEPRECATED
#define gsl_DEPRECATED_MSG(msg)
#endif

// `gsl_CONSTRAINT( ... )`: used in place of `typename`/`class` in a template
// parameter list. With C++20 or later it expands to its arguments unchanged
// (i.e. the constraint itself); before that it degrades to a plain `typename`.
// The macro is variadic, so it is not defined at all when the preprocessor
// lacks C99 variadic macro support.
#if gsl_HAVE(C99_PREPROCESSOR)
#if gsl_CPP20_OR_GREATER
#define gsl_CONSTRAINT(...) __VA_ARGS__
#else
#define gsl_CONSTRAINT(...) typename
#endif
#endif

// `gsl_STATIC_ASSERT_( cond, msg )`: compile-time assertion.
//
// Uses `static_assert` when available. The fallback forms the array type
// `char[1]` when `cond` holds and the ill-formed `char[-1]` when it does not,
// so a failing condition is rejected by the compiler (`msg` is ignored there).
// Note the single negation: `!(cond)` is 0 for a satisfied condition, giving
// size 1; the previous double negation inverted the check and rejected
// conditions that were true. The fallback is an expression, so it can only be
// used where an expression statement is allowed.
#if gsl_HAVE(TYPE_TRAITS)
#define gsl_STATIC_ASSERT_(cond, msg) static_assert(cond, msg)
#else
#define gsl_STATIC_ASSERT_(cond, msg) ((void)sizeof(char[1 - 2 * !(cond)]))
#endif

#if gsl_HAVE(TYPE_TRAITS)

// Implementation of gsl_DEFINE_ENUM_BITMASK_OPERATORS(): emits free operator
// overloads for `ENUM`. The binary and unary operators convert their operands
// to the enum's underlying type, apply the built-in operator, and convert the
// result back to `ENUM`; the compound assignments are expressed through the
// binary operators and return a reference to the left-hand operand.
#define gsl_DEFINE_ENUM_BITMASK_OPERATORS_(ENUM)                                                 \
    gsl_NODISCARD gsl_api inline gsl_constexpr ENUM operator~(ENUM val) gsl_noexcept {           \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                            \
        return ENUM(~U(val));                                                                    \
    }                                                                                            \
    gsl_NODISCARD gsl_api inline gsl_constexpr ENUM operator|(ENUM lhs, ENUM rhs) gsl_noexcept { \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                            \
        return ENUM(U(lhs) | U(rhs));                                                            \
    }                                                                                            \
    gsl_NODISCARD gsl_api inline gsl_constexpr ENUM operator&(ENUM lhs, ENUM rhs) gsl_noexcept { \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                            \
        return ENUM(U(lhs) & U(rhs));                                                            \
    }                                                                                            \
    gsl_NODISCARD gsl_api inline gsl_constexpr ENUM operator^(ENUM lhs, ENUM rhs) gsl_noexcept { \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                            \
        return ENUM(U(lhs) ^ U(rhs));                                                            \
    }                                                                                            \
    gsl_api inline gsl_constexpr14 ENUM &operator|=(ENUM &lhs, ENUM rhs) gsl_noexcept {          \
        return lhs = lhs | rhs;                                                                  \
    }                                                                                            \
    gsl_api inline gsl_constexpr14 ENUM &operator&=(ENUM &lhs, ENUM rhs) gsl_noexcept {          \
        return lhs = lhs & rhs;                                                                  \
    }                                                                                            \
    gsl_api inline gsl_constexpr14 ENUM &operator^=(ENUM &lhs, ENUM rhs) gsl_noexcept {          \
        return lhs = lhs ^ rhs;                                                                  \
    }

// Implementation of gsl_DEFINE_ENUM_RELATIONAL_OPERATORS(): emits free
// `<`, `>`, `<=`, `>=` overloads for `ENUM` that compare the operands after
// conversion to the enum's underlying type.
#define gsl_DEFINE_ENUM_RELATIONAL_OPERATORS_(ENUM)                                               \
    gsl_NODISCARD gsl_api inline gsl_constexpr bool operator<(ENUM lhs, ENUM rhs) gsl_noexcept {  \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                             \
        return U(lhs) < U(rhs);                                                                   \
    }                                                                                             \
    gsl_NODISCARD gsl_api inline gsl_constexpr bool operator>(ENUM lhs, ENUM rhs) gsl_noexcept {  \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                             \
        return U(lhs) > U(rhs);                                                                   \
    }                                                                                             \
    gsl_NODISCARD gsl_api inline gsl_constexpr bool operator<=(ENUM lhs, ENUM rhs) gsl_noexcept { \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                             \
        return U(lhs) <= U(rhs);                                                                  \
    }                                                                                             \
    gsl_NODISCARD gsl_api inline gsl_constexpr bool operator>=(ENUM lhs, ENUM rhs) gsl_noexcept { \
        typedef typename ::gsl::std11::underlying_type<ENUM>::type U;                             \
        return U(lhs) >= U(rhs);                                                                  \
    }

//
// Defines bitmask operators `|`, `&`, `^`, `~`, `|=`, `&=`, and `^=` for the
// given enum type.
//
//     enum class Vegetables { tomato = 0b001, onion = 0b010, eggplant = 0b100 };
//     gsl_DEFINE_ENUM_BITMASK_OPERATORS( Vegetables )
//
#define gsl_DEFINE_ENUM_BITMASK_OPERATORS(ENUM) gsl_DEFINE_ENUM_BITMASK_OPERATORS_(ENUM)

//
// Defines relational operators `<`, `>`, `<=`, `>=` for the given enum type.
//
//     enum class OperatorPrecedence { additive = 0, multiplicative = 1, power = 2 };
//     gsl_DEFINE_ENUM_RELATIONAL_OPERATORS( OperatorPrecedence )
//
#define gsl_DEFINE_ENUM_RELATIONAL_OPERATORS(ENUM) gsl_DEFINE_ENUM_RELATIONAL_OPERATORS_(ENUM)

#endif  // gsl_HAVE( TYPE_TRAITS )

// `gsl_DIMENSION_OF( a )`: number of elements of the array `a`, computed as the
// size of the whole array divided by the size of one element. The element is
// spelled `0 [a]` rather than `a[0]`; that form only compiles with the built-in
// subscript operator, so passing a class type with an overloaded `operator[]`
// is a compile error instead of a silently wrong result.
#define gsl_DIMENSION_OF(a) (sizeof(a) / sizeof(0 [a]))

// Method enabling (C++98, VC120 (VS2013) cannot use __VA_ARGS__)

// Helpers for declaring a function whose return type is constrained through
// expression SFINAE. With support, the leading return type becomes `auto` and
// `gsl_RETURN_DECLTYPE_( EXPR )` appends `-> decltype( EXPR )`; without it, the
// explicit type `T` is used and the trailing part disappears, so no constraint
// is applied.
#if gsl_HAVE(EXPRESSION_SFINAE)
#define gsl_TRAILING_RETURN_TYPE_(T) auto
#define gsl_RETURN_DECLTYPE_(EXPR) ->decltype(EXPR)
#else
#define gsl_TRAILING_RETURN_TYPE_(T) T
#define gsl_RETURN_DECLTYPE_(EXPR)
#endif

// NOTE: When using SFINAE in gsl-lite, please note that overloads of function
// templates must always use SFINAE with non-type default arguments
//       as explained in
//       https://en.cppreference.com/w/cpp/types/enable_if#Notes.
//       `gsl_ENABLE_IF_()` implements graceful fallback to default type
//       arguments (for compilers that don't support non-type default
//       arguments); please verify that this is appropriate in the given
//       situation, and add additional checks if necessary.
//
//       Also, please note that `gsl_ENABLE_IF_()` doesn't enforce the
//       constraint at all if no compiler/library support is available (i.e.
//       pre-C++11).

// `gsl_ENABLE_IF_( VA )`: appended to a template parameter list (note the
// leading comma in the expansion) to enable the template only if `VA` is true.
//  - Preferred form: a defaulted non-type parameter of type `int`.
//  - MSVC versions in the range [1, 140): a defaulted type parameter instead.
//  - No <type_traits> or no default function template arguments: expands to
//    nothing, i.e. the condition is not enforced.
#if gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG)
#if !gsl_BETWEEN(gsl_COMPILER_MSVC_VERSION, 1, \
                 140)  // VS 2013 seems to have trouble with SFINAE for default \
                       // non-type arguments
#define gsl_ENABLE_IF_(VA) , typename std::enable_if<(VA), int>::type = 0
#else
#define gsl_ENABLE_IF_(VA) , typename = typename std::enable_if<(VA), ::gsl::detail::enabler>::type
#endif
#else
#define gsl_ENABLE_IF_(VA)
#endif

// Other features:

// Derived feature flag: a constrained container constructor for span<> needs
// both default function template arguments and containers with a `data()`
// method.
#define gsl_HAVE_CONSTRAINED_SPAN_CONTAINER_CTOR \
    (gsl_HAVE_DEFAULT_FUNCTION_TEMPLATE_ARG && gsl_HAVE_CONTAINER_DATA_METHOD)
#define gsl_HAVE_CONSTRAINED_SPAN_CONTAINER_CTOR_() gsl_HAVE_CONSTRAINED_SPAN_CONTAINER_CTOR

// Derived feature flag: the unconstrained container constructor is available
// only if the configuration allows it and the compiler is not NVCC.
#define gsl_HAVE_UNCONSTRAINED_SPAN_CONTAINER_CTOR \
    (gsl_CONFIG_ALLOWS_UNCONSTRAINED_SPAN_CONTAINER_CTOR && gsl_COMPILER_NVCC_VERSION == 0)
#define gsl_HAVE_UNCONSTRAINED_SPAN_CONTAINER_CTOR_() gsl_HAVE_UNCONSTRAINED_SPAN_CONTAINER_CTOR

// GSL API (e.g. for CUDA platform):

// Guidelines for using `gsl_api`:
//
// NVCC imposes the restriction that a function annotated `__host__ __device__`
// cannot call host-only or device-only functions. This makes `gsl_api`
// inappropriate for generic functions that call unknown code, e.g. the template
// constructors of `span<>` or functions like `finally()` which accept an
// arbitrary  function object. It is often preferable to annotate functions only
// with `gsl_constexpr` or `gsl_constexpr14`. The "extended constexpr" mode of
// NVCC (currently an experimental feature) will implicitly consider constexpr
// functions `__host__ __device__` functions but tolerates calls to host-only or
// device-only functions.

// `gsl_api`: function annotation for CUDA builds. A definition supplied by the
// user beforehand is respected; otherwise the macro is `__host__ __device__`
// under a CUDA compiler and empty everywhere else.
#if !defined(gsl_api)
#if !defined(__CUDACC__)
#define gsl_api /*gsl_api*/
#else
#define gsl_api __host__ __device__
#endif
#endif  // !defined( gsl_api )

// Additional includes:

#if !gsl_CPP11_OR_GREATER
#include <algorithm>  // for swap() before C++11
#endif                // ! gsl_CPP11_OR_GREATER

#if gsl_HAVE(ARRAY)
#include <array>  // indirectly includes reverse_iterator<>
#endif

#if !gsl_HAVE(ARRAY)
#include <iterator>  // for reverse_iterator<>
#endif

#if !gsl_HAVE(CONSTRAINED_SPAN_CONTAINER_CTOR) || !gsl_HAVE(AUTO)
#include <vector>
#endif

#if gsl_HAVE(INITIALIZER_LIST)
#include <initializer_list>
#endif

#if defined(gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS)
#include <cassert>
#endif

#if defined(gsl_CONFIG_CONTRACT_VIOLATION_TRAPS) && \
        gsl_COMPILER_MSVC_VERSION >= 110  // __fastfail() supported by VS 2012 and later
#include <intrin.h>
#endif

#if gsl_HAVE(ENUM_CLASS) && gsl_COMPILER_ARMCC_VERSION
#include <endian.h>
#endif

#if gsl_HAVE(TYPE_TRAITS)
#include <type_traits>  // for enable_if<>,
// add_const<>, add_pointer<>, common_type<>, make_signed<>, remove_cv<>,
// remove_const<>, remove_volatile<>, remove_reference<>, remove_cvref<>,
// remove_pointer<>, underlying_type<>, is_assignable<>, is_constructible<>,
// is_const<>, is_convertible<>, is_integral<>, is_pointer<>, is_signed<>,
// integral_constant<>, declval()
#elif gsl_HAVE(TR1_TYPE_TRAITS)
#include <tr1/type_traits>  // for add_const<>, remove_cv<>, remove_const<>, remove_volatile<>, remove_reference<>, integral_constant<>
#endif

// Only needed for the experimental return-guard feature, and only when the
// standard library does not already provide `std::uncaught_exceptions()`.
#if gsl_FEATURE(EXPERIMENTAL_RETURN_GUARD)

// Declare __cxa_get_globals() or equivalent in namespace gsl::detail for
// uncaught_exceptions():

#if !gsl_HAVE(UNCAUGHT_EXCEPTIONS)
#if defined(_MSC_VER)  // MS-STL with either MSVC or clang-cl
namespace gsl {
namespace detail {
// Runtime-internal accessor, declared here by hand.
extern "C" char *__cdecl _getptd();
}
}  // namespace gsl
#elif gsl_COMPILER_CLANG_VERSION || gsl_COMPILER_GNUC_VERSION || gsl_COMPILER_APPLECLANG_VERSION
#if defined(__GLIBCXX__) || defined(__GLIBCPP__)  // libstdc++: prototype from cxxabi.h
#include <cxxabi.h>
#elif !defined(BOOST_CORE_UNCAUGHT_EXCEPTIONS_HPP_INCLUDED_)  // libc++: prototype from \
                                                              // Boost?
// No prototype available from a header: declare it manually. The two variants
// differ only in the exception specification (none on FreeBSD/OpenBSD,
// `gsl_noexcept` elsewhere).
#if defined(__FreeBSD__) || defined(__OpenBSD__)
namespace __cxxabiv1 {
struct __cxa_eh_globals;
extern "C" __cxa_eh_globals *__cxa_get_globals();
}  // namespace __cxxabiv1
#else
namespace __cxxabiv1 {
struct __cxa_eh_globals;
extern "C" __cxa_eh_globals *__cxa_get_globals() gsl_noexcept;
}  // namespace __cxxabiv1
#endif
#endif
namespace gsl {
namespace detail {
// Make the ABI function reachable as gsl::detail::__cxa_get_globals.
using ::__cxxabiv1::__cxa_get_globals;
}
}  // namespace gsl
#endif
#endif  // ! gsl_HAVE( UNCAUGHT_EXCEPTIONS )
#endif  // gsl_FEATURE( EXPERIMENTAL_RETURN_GUARD )

// MSVC warning suppression macros:

// Warning-control helpers. They are active only for MSVC version >= 140 when
// not compiling with NVCC; for every other compiler all four expand to nothing.
//  - gsl_SUPPRESS_MSGSL_WARNING( expr ): currently expands to nothing in both
//    branches (the `[[gsl::suppress]]` attribute is commented out).
//  - gsl_SUPPRESS_MSVC_WARNING( code, descr ): suppresses warning `code` via
//    `#pragma warning(suppress)`; `descr` is documentation only.
//  - gsl_DISABLE_MSVC_WARNINGS( codes ) / gsl_RESTORE_MSVC_WARNINGS(): push the
//    warning state and disable `codes` / pop the warning state again.
#if gsl_COMPILER_MSVC_VERSION >= 140 && !gsl_COMPILER_NVCC_VERSION
#define gsl_SUPPRESS_MSGSL_WARNING(expr) /* Pimm: note disabled for intel [[gsl::suppress(expr)]]*/
#define gsl_SUPPRESS_MSVC_WARNING(code, descr) __pragma(warning(suppress : code))
#define gsl_DISABLE_MSVC_WARNINGS(codes) __pragma(warning(push)) __pragma(warning(disable : codes))
#define gsl_RESTORE_MSVC_WARNINGS() __pragma(warning(pop))
#else
// TODO: define for Clang
#define gsl_SUPPRESS_MSGSL_WARNING(expr)
#define gsl_SUPPRESS_MSVC_WARNING(code, descr)
#define gsl_DISABLE_MSVC_WARNINGS(codes)
#define gsl_RESTORE_MSVC_WARNINGS()
#endif

// Suppress the following MSVC GSL warnings:
// - C26432: gsl::c.21 : if you define or delete any default operation in the
// type '...', define or delete them all
// - C26410: gsl::r.32 : the parameter 'ptr' is a reference to const unique
// pointer, use const T* or const T& instead
// - C26415: gsl::r.30 : smart pointer parameter 'ptr' is used only to access
// contained pointer. Use T* or T& instead
// - C26418: gsl::r.36 : shared pointer parameter 'ptr' is not copied or moved.
// Use T* or T& instead
// - C26472: gsl::t.1  : don't use a static_cast for arithmetic conversions;
//                       use brace initialization, gsl::narrow_cast or
//                       gsl::narrow
// - C26439: gsl::f.6  : special function 'function' can be declared 'noexcept'
// - C26440: gsl::f.6  : function 'function' can be declared 'noexcept'
// - C26455: gsl::f.6  : default constructor may not throw. Declare it
// 'noexcept'
// - C26473: gsl::t.1  : don't cast between pointer types where the source type
// and the target type are the same
// - C26481: gsl::b.1  : don't use pointer arithmetic. Use span instead
// - C26482: gsl::b.2  : only index into arrays using constant expressions
// - C26446: gsl::b.4  : prefer to use gsl::at() instead of unchecked subscript
// operator
// - C26490: gsl::t.1  : don't use reinterpret_cast
// - C26487: gsl::l.4  : don't return a pointer '(<some number>'s result)' that
// may be invalid
// - C26457: es.48     : (void) should not be used to ignore return values, use
// 'std::ignore =' instead

// Pushes the warning state and disables the codes below on MSVC; per the macro
// definition this line expands to nothing for every other compiler.
gsl_DISABLE_MSVC_WARNINGS(
        26432 26410 26415 26418 26472 26439 26440 26455 26473 26481 26482 26446 26490 26487 26457)

        namespace gsl {
    // forward declare span<>:

    template <class T>
    class span;

    // C++98 emulation:

    namespace std98 {

    // We implement `equal()` and `lexicographical_compare()` here to avoid having
    // to pull in the <algorithm> header.

    // Returns true if every element of [first1, last1) compares equal (using
    // `==`) to the element at the same position of the range starting at
    // `first2`. The second range must be at least as long as the first. An
    // empty first range yields true.
    template <class InputIt1, class InputIt2>
    bool equal(InputIt1 first1, InputIt1 last1, InputIt2 first2) {
        // Implementation borrowed from
        // https://en.cppreference.com/w/cpp/algorithm/equal.
        // The `(void)` cast makes sure the built-in comma operator is used even
        // if the iterator types provide an overloaded `operator,`.
        for (; first1 != last1; ++first1, (void)++first2) {
            if (!(*first1 == *first2))
                return false;
        }
        return true;
    }

    // Returns true if [first1, last1) is lexicographically less than
    // [first2, last2), comparing elements with `<`. A proper prefix is less
    // than the longer range; two equal ranges are not less than each other.
    template <class InputIt1, class InputIt2>
    bool lexicographical_compare(InputIt1 first1, InputIt1 last1, InputIt2 first2, InputIt2 last2) {
        // Implementation borrowed from
        // https://en.cppreference.com/w/cpp/algorithm/lexicographical_compare.
        for (; first1 != last1 && first2 != last2; ++first1, (void)++first2) {
            if (*first1 < *first2)
                return true;
            if (*first2 < *first1)
                return false;
        }
        // All common elements are equivalent: the first range is less only if
        // it ran out while the second still has elements.
        return first1 == last1 && first2 != last2;
    }

    }  // namespace std98

    // C++11 emulation:

    // Each trait below is taken from <type_traits> when available, from the TR1
    // library as a second choice, and is otherwise re-implemented locally.
    namespace std11 {

#if gsl_HAVE(ADD_CONST)

    using std::add_const;

#elif gsl_HAVE(TR1_ADD_CONST)

    using std::tr1::add_const;

#else

    // Fallback: `add_const<T>::type` is `const T`.
    template <class T>
    struct add_const {
        typedef const T type;
    };

#endif  // gsl_HAVE( ADD_CONST )

#if gsl_HAVE(REMOVE_CONST)

    using std::remove_const;
    using std::remove_cv;
    using std::remove_volatile;

#elif gsl_HAVE(TR1_REMOVE_CONST)

    using std::tr1::remove_const;
    using std::tr1::remove_cv;
    using std::tr1::remove_volatile;

#else

    // Fallback: strips a top-level `const`; the primary template passes the
    // type through unchanged.
    template <class T>
    struct remove_const {
        typedef T type;
    };
    template <class T>
    struct remove_const<T const> {
        typedef T type;
    };

    // Fallback: strips a top-level `volatile`.
    template <class T>
    struct remove_volatile {
        typedef T type;
    };
    template <class T>
    struct remove_volatile<T volatile> {
        typedef T type;
    };

    // Fallback: strips `const` first, then `volatile`.
    template <class T>
    struct remove_cv {
        typedef typename remove_volatile<typename remove_const<T>::type>::type type;
    };

#endif  // gsl_HAVE( REMOVE_CONST )

#if gsl_HAVE(REMOVE_REFERENCE)

    using std::remove_reference;

#elif gsl_HAVE(TR1_REMOVE_REFERENCE)

    using std::tr1::remove_reference;

#else

    // Fallback: maps `T &` (and `T &&` where rvalue references exist) to `T`.
    template <class T>
    struct remove_reference {
        typedef T type;
    };
    template <class T>
    struct remove_reference<T &> {
        typedef T type;
    };
#if gsl_HAVE(RVALUE_REFERENCE)
    template <class T>
    struct remove_reference<T &&> {
        typedef T type;
    };
#endif

#endif  // gsl_HAVE( REMOVE_REFERENCE )

#if gsl_HAVE(INTEGRAL_CONSTANT)

    using std::false_type;
    using std::integral_constant;
    using std::true_type;

#elif gsl_HAVE(TR1_INTEGRAL_CONSTANT)

    using std::tr1::false_type;
    using std::tr1::integral_constant;
    using std::tr1::true_type;

#else

    // Fallback: exposes only `value`, and as an enumerator rather than a static
    // data member of type `T`; the `value_type` and `type` members of the
    // standard trait are not provided.
    template <class T, T v>
    struct integral_constant {
        enum { value = v };
    };
    typedef integral_constant<bool, true> true_type;
    typedef integral_constant<bool, false> false_type;

#endif

#if gsl_HAVE(TYPE_TRAITS)

    using std::underlying_type;

#elif gsl_HAVE(TR1_TYPE_TRAITS)

    using std::tr1::underlying_type;

#else

    // We could try to define `underlying_type<>` for pre-C++11 here, but let's
    // not until someone actually needs it.

#endif

    }  // namespace std11

    // C++14 emulation:

    namespace std14 {

    // `make_unique()` is provided only where `std::unique_ptr` exists: the
    // standard function is re-exported when the library has it, otherwise a
    // variadic stand-in is defined (if variadic templates are available).
#if gsl_HAVE(UNIQUE_PTR) && gsl_HAVE(MAKE_UNIQUE)

    using std::make_unique;

#elif gsl_HAVE(UNIQUE_PTR) && gsl_HAVE(VARIADIC_TEMPLATE)

    // Constructs a `T` from the perfectly forwarded arguments with `new` and
    // hands ownership to the returned `std::unique_ptr<T>`.
    template <class T, class... CtorArgs>
    gsl_NODISCARD std::unique_ptr<T> make_unique(CtorArgs &&...ctor_args) {
        return std::unique_ptr<T>(new T(std::forward<CtorArgs>(ctor_args)...));
    }

#endif  // gsl_HAVE( UNIQUE_PTR ) && ( gsl_HAVE( MAKE_UNIQUE ) || gsl_HAVE( VARIADIC_TEMPLATE ) )

    }  // namespace std14

    namespace detail {

#if gsl_HAVE(VARIADIC_TEMPLATE)

    // Recursion helper for `std17::conjunction<>`. `Value` is `Head::value`.
    // The primary template stops the recursion and reports `Head` (reached when
    // `Value` is false or `Head` is the last trait); the specialization moves
    // on to the next trait while the current one is true.
    template <bool Value, class Head, class... Tail>
    struct conjunction_ {
        typedef Head type;
    };
    template <class Head, class Next, class... Tail>
    struct conjunction_<true, Head, Next, Tail...> : conjunction_<Next::value, Next, Tail...> {};

    // Recursion helper for `std17::disjunction<>`: same scheme, but it keeps
    // going while the current trait is false.
    template <bool Value, class Head, class... Tail>
    struct disjunction_ {
        typedef Head type;
    };
    template <class Head, class Next, class... Tail>
    struct disjunction_<false, Head, Next, Tail...> : disjunction_<Next::value, Next, Tail...> {};

#endif

    // Always-false trait whose value formally depends on a template parameter.
    template <typename T>
    struct dependent_false : std11::integral_constant<bool, false> {};

    }  // namespace detail

    // C++17 emulation:

    namespace std17 {

    // `bool_constant<v>`: an `integral_constant` of type `bool`.
    template <bool v>
    struct bool_constant : std11::integral_constant<bool, v> {};

#if gsl_CPP11_120

    // `conjunction<Ts...>`: derives from the first trait whose `value` is
    // false, or from the last trait if none is; `true_type` for an empty list.
    template <class... Ts>
    struct conjunction;
    template <>
    struct conjunction<> : std11::true_type {};
    template <class T0, class... Ts>
    struct conjunction<T0, Ts...> : detail::conjunction_<T0::value, T0, Ts...>::type {};

    // `disjunction<Ts...>`: derives from the first trait whose `value` is true,
    // or from the last trait if none is; `false_type` for an empty list.
    template <class... Ts>
    struct disjunction;
    template <>
    struct disjunction<> : std11::false_type {};
    template <class T0, class... Ts>
    struct disjunction<T0, Ts...> : detail::disjunction_<T0::value, T0, Ts...>::type {};

    // `negation<T>`: logical NOT of `T::value`.
    template <class T>
    struct negation : std11::integral_constant<bool, !T::value> {};

#if gsl_CPP14_OR_GREATER

    // Variable-template shorthands for the traits above.
    template <class... Ts>
    constexpr bool conjunction_v = conjunction<Ts...>::value;
    template <class... Ts>
    constexpr bool disjunction_v = disjunction<Ts...>::value;
    template <class T>
    constexpr bool negation_v = negation<T>::value;

#endif  // gsl_CPP14_OR_GREATER

    // `void_t<Ts...>` is `void` for any well-formed `Ts...`. It is routed
    // through the helper `make_void<>` instead of being a direct alias.
    template <class... Ts>
    struct make_void {
        typedef void type;
    };

    template <class... Ts>
    using void_t = typename make_void<Ts...>::type;

#endif  // gsl_CPP11_120

#if gsl_HAVE(CONSTRAINED_SPAN_CONTAINER_CTOR)

    // `size()`: element count of a built-in array (`N`) or of a container (the
    // result of `cont.size()`). `std::size_t` is spelled with its namespace,
    // as elsewhere in this file, so the code does not depend on the name also
    // being declared in the global namespace.
    template <class T, std::size_t N>
    gsl_NODISCARD gsl_api inline gsl_constexpr auto size(T const (&)[N]) gsl_noexcept
            -> std::size_t {
        return N;
    }

    template <class C>
    gsl_NODISCARD inline gsl_constexpr auto size(C const &cont) -> decltype(cont.size()) {
        return cont.size();
    }

    // `data()`: pointer to the first element of a built-in array, the result
    // of `cont.data()` for a (const or non-const) container, or `il.begin()`
    // for an initializer list.
    template <class T, std::size_t N>
    gsl_NODISCARD gsl_api inline gsl_constexpr auto data(T (&arr)[N]) gsl_noexcept -> T * {
        return &arr[0];
    }

    template <class C>
    gsl_NODISCARD inline gsl_constexpr auto data(C &cont) -> decltype(cont.data()) {
        return cont.data();
    }

    template <class C>
    gsl_NODISCARD inline gsl_constexpr auto data(C const &cont) -> decltype(cont.data()) {
        return cont.data();
    }

    template <class E>
    gsl_NODISCARD inline gsl_constexpr auto data(std::initializer_list<E> il) gsl_noexcept
            -> E const * {
        return il.begin();
    }

#endif  // gsl_HAVE( CONSTRAINED_SPAN_CONTAINER_CTOR )

    }  // namespace std17

    // C++20 emulation:

    namespace std20 {

#if gsl_CPP11_100

    // Function object that returns its argument unchanged, perfectly forwarded.
    struct identity {
        template <class T>
        gsl_constexpr T &&operator()(T &&arg) const gsl_noexcept {
            return std::forward<T>(arg);
        }
    };

#if gsl_HAVE(ENUM_CLASS)
    // Byte-order enumeration. `native` equals `little` or `big` depending on
    // the target:
    //  - `_WIN32`: hard-coded to little-endian;
    //  - GCC / Clang / Apple Clang: taken from the compiler's predefined macros;
    //  - ARMCC: taken from the <endian.h> macros;
    //  - any other compiler: the enumeration has no enumerators at all.
    enum class endian {
#if defined(_WIN32)
        little = 0,
        big = 1,
        native = little
#elif gsl_COMPILER_GNUC_VERSION || gsl_COMPILER_CLANG_VERSION || gsl_COMPILER_APPLECLANG_VERSION
        little = __ORDER_LITTLE_ENDIAN__,
        big = __ORDER_BIG_ENDIAN__,
        native = __BYTE_ORDER__
#elif gsl_COMPILER_ARMCC_VERSION
        // from <endian.h> header file
        little = __LITTLE_ENDIAN,
        big = __BIG_ENDIAN,
        native = __BYTE_ORDER
#else
// Do not define any endianness constants for unknown compilers.
#endif
    };
#endif  // gsl_HAVE( ENUM_CLASS )

#endif  // gsl_CPP11_100

    // `type_identity<T>::type` is `T`.
    template <class T>
    struct type_identity {
        typedef T type;
    };
#if gsl_HAVE(ALIAS_TEMPLATE)
    template <class T>
    using type_identity_t = typename type_identity<T>::type;
#endif  // gsl_HAVE( ALIAS_TEMPLATE )

#if gsl_HAVE(STD_SSIZE)

    using std::ssize;

#elif gsl_HAVE(CONSTRAINED_SPAN_CONTAINER_CTOR)

    // Signed size of a container: `c.size()` converted to the common type of
    // `std::ptrdiff_t` and the signed counterpart of the container's size type.
    template <class C>
    gsl_NODISCARD gsl_constexpr auto ssize(C const &c) ->
            typename std::common_type<std::ptrdiff_t,
                                      typename std::make_signed<decltype(c.size())>::type>::type {
        using R = typename std::common_type<
                std::ptrdiff_t, typename std::make_signed<decltype(c.size())>::type>::type;
        return static_cast<R>(c.size());
    }

    // Signed size of a built-in array: its extent `N` as `std::ptrdiff_t`.
    template <class T, std::size_t N>
    gsl_NODISCARD gsl_constexpr auto ssize(T const (&)[N]) gsl_noexcept -> std::ptrdiff_t {
        return std::ptrdiff_t(N);
    }

#endif  // gsl_HAVE( STD_SSIZE )

#if gsl_HAVE(REMOVE_CVREF)

    using std::remove_cvref;

#else

    // Fallback: removes the reference first, then top-level cv-qualifiers.
    template <class T>
    struct remove_cvref {
        typedef typename std11::remove_cv<typename std11::remove_reference<T>::type>::type type;
    };

#endif  // gsl_HAVE( REMOVE_CVREF )

    }  // namespace std20

    namespace detail {

    /// for gsl_ENABLE_IF_()

    // Empty tag type used as the `enable_if` result type in the type-parameter
    // form of gsl_ENABLE_IF_().
    /*enum*/ class enabler {};

#if gsl_HAVE(TYPE_TRAITS)

    // `is_span<Q>`: true if `Q`, ignoring cv-qualifiers, is a `span<T>`.
    template <class Q>
    struct is_span_oracle : std::false_type {};

    template <class T>
    struct is_span_oracle<span<T>> : std::true_type {};

    template <class Q>
    struct is_span : is_span_oracle<typename std::remove_cv<Q>::type> {};

    // `is_std_array<Q>`: true if `Q`, ignoring cv-qualifiers, is a
    // `std::array<T, N>`; always false when <array> is unavailable.
    template <class Q>
    struct is_std_array_oracle : std::false_type {};

#if gsl_HAVE(ARRAY)

    template <class T, std::size_t Extent>
    struct is_std_array_oracle<std::array<T, Extent>> : std::true_type {};

#endif

    template <class Q>
    struct is_std_array : is_std_array_oracle<typename std::remove_cv<Q>::type> {};

    // `is_array<Q>`: true for built-in array types of known or unknown bound.
    template <class Q>
    struct is_array : std::false_type {};

    template <class T>
    struct is_array<T[]> : std::true_type {};

    template <class T, std::size_t N>
    struct is_array<T[N]> : std::true_type {};

#if gsl_CPP11_140 && !gsl_BETWEEN(gsl_COMPILER_GNUC_VERSION, 1, 500)

    // `has_size_and_data<C>`: true if both `std17::size()` and `std17::data()`
    // can be called on a `C`.
    template <class, class = void>
    struct has_size_and_data : std::false_type {};

    template <class C>
    struct has_size_and_data<C,
                             std17::void_t<decltype(std17::size(std::declval<C>())),
                                           decltype(std17::data(std::declval<C>()))>>
            : std::true_type {};

    // `is_compatible_element<C, E>`: true if a pointer to an array of `C`'s
    // element type (the pointee of `std17::data()`) converts to a pointer to an
    // array of `E`.
    template <class, class, class = void>
    struct is_compatible_element : std::false_type {};

    template <class C, class E>
    struct is_compatible_element<C,
                                 E,
                                 std17::void_t<decltype(std17::data(std::declval<C>())),
                                               typename std::remove_pointer<decltype(std17::data(
                                                       std::declval<C &>()))>::type (*)[]>>
            : std::is_convertible<typename std::remove_pointer<decltype(std17::data(
                                          std::declval<C &>()))>::type (*)[],
                                  E (*)[]> {};

    // `is_container<C>`: has size and data, and is neither a span, a built-in
    // array, nor a std::array.
    template <class C>
    struct is_container
            : std17::bool_constant<!is_span<C>::value && !is_array<C>::value &&
                                   !is_std_array<C>::value && has_size_and_data<C>::value> {};

    // `is_compatible_container<C, E>`: a container whose elements are
    // compatible with `E`.
    template <class C, class E>
    struct is_compatible_container
            : std17::bool_constant<is_container<C>::value && is_compatible_element<C, E>::value> {};

#else  // ^^^ gsl_CPP11_140 && ! gsl_BETWEEN( gsl_COMPILER_GNUC_VERSION, 1, 500 ) \
        // ^^^ / vvv ! gsl_CPP11_140 || gsl_BETWEEN( gsl_COMPILER_GNUC_VERSION, 1, \
        // 500 ) vvv

    // Fallback for older compilers: the same conditions are expressed as
    // defaulted template parameters. This template header applies to whichever
    // struct the preprocessor selects directly below.
    template <
            class C,
            class E,
            typename = typename std::enable_if<
                    !is_span<C>::value && !is_array<C>::value && !is_std_array<C>::value &&
                            (std::is_convertible<typename std::remove_pointer<decltype(std17::data(
                                                         std::declval<C &>()))>::type (*)[],
                                                 E (*)[]>::value)
                    //  &&   has_size_and_data< C >::value
                    ,
                    enabler>::type,
            class = decltype(std17::size(std::declval<C>())),
            class = decltype(std17::data(std::declval<C>()))>
#if gsl_BETWEEN(gsl_COMPILER_MSVC_VERSION, 1, 140)
    // VS2013 has insufficient support for expression SFINAE; we cannot make
    // `is_compatible_container<>` a proper type trait here
    struct is_compatible_container : std::true_type {
    };
#else
    // Constructible from `int` only if the constraints in the template header
    // are satisfied.
    struct is_compatible_container_r {
        is_compatible_container_r(int);
    };
    // Overload pair used as the detector: the first overload is viable only if
    // `is_compatible_container_r<C, E>` is a valid type; the variadic one is
    // the catch-all.
    template <class C, class E>
    std::true_type is_compatible_container_f(is_compatible_container_r<C, E>);
    template <class C, class E>
    std::false_type is_compatible_container_f(...);

    template <class C, class E>
    struct is_compatible_container : decltype(is_compatible_container_f<C, E>(0)) {};
#endif  // gsl_BETWEEN( gsl_COMPILER_MSVC_VERSION, 1, 140 )

#endif  // gsl_CPP11_140 && ! gsl_BETWEEN( gsl_COMPILER_GNUC_VERSION, 1, 500 )

#endif  // gsl_HAVE( TYPE_TRAITS )

    }  // namespace detail

    //
    // GSL.util: utilities
    //

    // The four aliases below all name the same configurable type,
    // `gsl_CONFIG_INDEX_TYPE`; they differ only in the intent they express.

    // Integer type for indices (e.g. in a loop).
    typedef gsl_CONFIG_INDEX_TYPE index;

    // Integer type for dimensions.
    typedef gsl_CONFIG_INDEX_TYPE dim;

    // Integer type for array strides.
    typedef gsl_CONFIG_INDEX_TYPE stride;

    // Integer type for pointer, iterator, or index differences.
    typedef gsl_CONFIG_INDEX_TYPE diff;

//
// GSL.owner: ownership pointers
//
// Re-export the standard smart pointers and their factory functions into
// namespace gsl.
#if gsl_HAVE(SHARED_PTR)
    using std::make_shared;
    using std::shared_ptr;
    using std::unique_ptr;
// `std14::make_unique` is only declared when `gsl_HAVE( UNIQUE_PTR )` holds in
// addition to one of the two conditions below, so the same guard is required
// here; otherwise the using-declaration would name an undeclared entity.
#if gsl_HAVE(UNIQUE_PTR) && (gsl_HAVE(MAKE_UNIQUE) || gsl_HAVE(VARIADIC_TEMPLATE))
    using std14::make_unique;
#endif
#endif

// `owner<T>`: annotation for an owning pointer.
//  - With alias templates, `owner<T>` is simply `T`; where <type_traits> is
//    available it is additionally restricted to pointer types.
//  - Without alias templates, and only for defaults version 0, a legacy struct
//    exposes the type as `owner<T>::type` instead.
#if gsl_HAVE(ALIAS_TEMPLATE)
    template <class T
#if gsl_HAVE(TYPE_TRAITS)
              ,
              typename = typename std::enable_if<std::is_pointer<T>::value>::type
#endif
              >
    using owner = T;
#elif gsl_CONFIG(DEFAULTS_VERSION) == 0
    // TODO vNext: remove
    template <class T>
    struct owner {
        typedef T type;
    };
#endif

// The `owner<>` alias template exists exactly when alias templates do.
#define gsl_HAVE_OWNER_TEMPLATE gsl_HAVE_ALIAS_TEMPLATE
#define gsl_HAVE_OWNER_TEMPLATE_() gsl_HAVE_OWNER_TEMPLATE

// Optional `Owner( t )` macro: spells the owner type uniformly, whether
// `owner<>` is the alias template or the legacy struct with a nested `type`.
// TODO vNext: remove
#if gsl_FEATURE(OWNER_MACRO)
#if gsl_HAVE(OWNER_TEMPLATE)
#define Owner(t) ::gsl::owner<t>
#else
#define Owner(t) ::gsl::owner<t>::type
#endif
#endif

    //
    // GSL.assert: assertions
    //

// `gsl_ELIDE_( x )`: form of a contract check that is compiled out. The
// condition is never evaluated (it only appears inside `decltype`); where
// <type_traits> is available it is still checked to be convertible to bool,
// otherwise the macro expands to nothing.
#if gsl_HAVE(TYPE_TRAITS)
#define gsl_ELIDE_(x)                                                \
    static_assert(::std::is_constructible<bool, decltype(x)>::value, \
                  "argument of contract check must be convertible to bool")
#else
#define gsl_ELIDE_(x)
#endif
// `gsl_NO_OP_()`: an expression of type void that does nothing.
#define gsl_NO_OP_() (static_cast<void>(0))

// `gsl_ASSUME_( x )` / `gsl_ASSUME_UNREACHABLE_()`: optimizer hints, defined
// only when unenforced contracts are configured to be assumed. Selection order:
//  1. CUDA device code: `__builtin_unreachable()` for NVCC version >= 113,
//     otherwise the check is merely elided / a no-op;
//  2. MSVC version >= 140: `__assume()`;
//  3. GCC-compatible compilers: `__builtin_unreachable()`;
//  4. any compiler reporting `__builtin_unreachable` through `__has_builtin`;
//  5. anything else: hard error.
// Note that the `__builtin_unreachable()` forms evaluate `x`.
#if defined(gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME)
#if defined(__CUDACC__) && defined(__CUDA_ARCH__)
#if gsl_COMPILER_NVCC_VERSION >= 113
#define gsl_ASSUME_(x) ((x) ? static_cast<void>(0) : __builtin_unreachable())
#define gsl_ASSUME_UNREACHABLE_() __builtin_unreachable()
#else
#define gsl_ASSUME_(x) gsl_ELIDE_(x) /* there is no assume intrinsic in CUDA device code */
#define gsl_ASSUME_UNREACHABLE_() \
    gsl_NO_OP_() /* there is no assume intrinsic in CUDA device code */
#endif
#elif gsl_COMPILER_MSVC_VERSION >= 140
#define gsl_ASSUME_(x) __assume(x)
#define gsl_ASSUME_UNREACHABLE_() __assume(0)
#elif gsl_COMPILER_GNUC_VERSION
#define gsl_ASSUME_(x) ((x) ? static_cast<void>(0) : __builtin_unreachable())
#define gsl_ASSUME_UNREACHABLE_() __builtin_unreachable()
#elif defined(__has_builtin)
#if __has_builtin(__builtin_unreachable)
#define gsl_ASSUME_(x) ((x) ? static_cast<void>(0) : __builtin_unreachable())
#define gsl_ASSUME_UNREACHABLE_() __builtin_unreachable()
#else
#error gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME: gsl-lite does not know how to generate UB optimization hints for this compiler; use gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE instead
#endif
#else
#error gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME: gsl-lite does not know how to generate UB optimization hints for this compiler; use gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE instead
#endif
#endif  // defined( gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME )

// `gsl_CONTRACT_UNENFORCED_( x )`: what a contract check turns into when it is
// not enforced -- elided by default, or an optimizer assumption if
// `gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME` is defined.
#if !defined(gsl_CONFIG_UNENFORCED_CONTRACTS_ASSUME)
// defined( gsl_CONFIG_UNENFORCED_CONTRACTS_ELIDE ) [default]
#define gsl_CONTRACT_UNENFORCED_(x) gsl_ELIDE_(x)
#else
#define gsl_CONTRACT_UNENFORCED_(x) gsl_ASSUME_(x)
#endif

// `gsl_TRAP_()`: emits a trap, defined only when contract violations are
// configured to trap. Selection order: CUDA device code (`__trap()`), MSVC
// version >= 110 (`__fastfail()`), GCC-compatible compilers and any compiler
// reporting `__builtin_trap` through `__has_builtin` (`__builtin_trap()`);
// anything else is a hard error.
#if defined(gsl_CONFIG_CONTRACT_VIOLATION_TRAPS)
#if defined(__CUDACC__) && defined(__CUDA_ARCH__)
#define gsl_TRAP_() __trap()
#elif gsl_COMPILER_MSVC_VERSION >= 110  // __fastfail() supported by VS 2012 and later
#define gsl_TRAP_() \
    __fastfail(0) /* legacy failure code for buffer-overrun errors, cf. winnt.h, \
                   "Fast fail failure codes" */
#elif gsl_COMPILER_GNUC_VERSION
#define gsl_TRAP_() __builtin_trap()
#elif defined(__has_builtin)
#if __has_builtin(__builtin_trap)
#define gsl_TRAP_() __builtin_trap()
#else
#error gsl_CONFIG_CONTRACT_VIOLATION_TRAPS: gsl-lite does not know how to generate a trap instruction for this compiler; use gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES instead
#endif
#else
#error gsl_CONFIG_CONTRACT_VIOLATION_TRAPS: gsl-lite does not know how to generate a trap instruction for this compiler; use gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES instead
#endif
#endif  // defined( gsl_CONFIG_CONTRACT_VIOLATION_TRAPS )

// gsl_CONTRACT_CHECK_(str, x): evaluates `x` and reacts to a false result
// according to the configured violation policy; `str` names the kind of
// contract that failed.
// gsl_FAILFAST_(): unconditional failure using the same policy.
//
// Policy selection, first match wins:
//   1. gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER - call the user's handler
//   2. CUDA device code                            - assert() or __trap()
//   3. gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS       - assert()
//   4. gsl_CONFIG_CONTRACT_VIOLATION_TRAPS         - gsl_TRAP_()
//   5. gsl_CONFIG_CONTRACT_VIOLATION_THROWS        - throw via fail_fast_throw()
//   6. otherwise (default)                         - std::terminate()
#if defined(gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER)
#define gsl_CONTRACT_CHECK_(str, x) \
    ((x) ? static_cast<void>(0) : ::gsl::fail_fast_assert_handler(#x, str, __FILE__, __LINE__))
#if defined(__CUDACC__) && defined(__CUDA_ARCH__)
// gsl_TRAP_() is only defined under gsl_CONFIG_CONTRACT_VIOLATION_TRAPS, so it
// cannot be relied upon in this branch; call the CUDA intrinsic directly, as
// the non-handler CUDA branch below does.
#define gsl_FAILFAST_()                                                       \
    (::gsl::fail_fast_assert_handler("", "GSL: failure", __FILE__, __LINE__), \
     __trap()) /* do not let the custom assertion handler continue execution */
#else
#define gsl_FAILFAST_()                                                       \
    (::gsl::fail_fast_assert_handler("", "GSL: failure", __FILE__, __LINE__), \
     ::gsl::detail::fail_fast_terminate()) /* do not let the custom assertion    \
                                            handler continue execution */
#endif
#elif defined(__CUDACC__) && defined(__CUDA_ARCH__)
// CUDA device code without a custom handler.
#if defined(gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS) || !defined(NDEBUG)
#define gsl_CONTRACT_CHECK_(str, x) assert(str && (x))
#else
#define gsl_CONTRACT_CHECK_(str, x) ((x) ? static_cast<void>(0) : __trap())
#endif
#define gsl_FAILFAST_() (__trap())
#elif defined(gsl_CONFIG_CONTRACT_VIOLATION_ASSERTS)
#define gsl_CONTRACT_CHECK_(str, x) assert(str && (x))
#if !defined(NDEBUG)
#define gsl_FAILFAST_() (assert(!"GSL: failure"), ::gsl::detail::fail_fast_terminate())
#else
// With NDEBUG assert() does nothing, so terminate directly.
#define gsl_FAILFAST_() (::gsl::detail::fail_fast_terminate())
#endif
#elif defined(gsl_CONFIG_CONTRACT_VIOLATION_TRAPS)
#define gsl_CONTRACT_CHECK_(str, x) ((x) ? static_cast<void>(0) : gsl_TRAP_())
#if gsl_COMPILER_MSVC_VERSION
#define gsl_FAILFAST_() (gsl_TRAP_(), ::gsl::detail::fail_fast_terminate())
#else
#define gsl_FAILFAST_() (gsl_TRAP_())
#endif
#elif defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS)
// The exception message is assembled at compile time from the contract kind,
// the stringified expression, and the file/line of the check.
#define gsl_CONTRACT_CHECK_(str, x)                                     \
    ((x) ? static_cast<void>(0)                                         \
         : ::gsl::detail::fail_fast_throw(str ": '" #x "' at " __FILE__ \
                                              ":" gsl_STRINGIFY(__LINE__)))
#define gsl_FAILFAST_() \
    (::gsl::detail::fail_fast_throw("GSL: failure at " __FILE__ ":" gsl_STRINGIFY(__LINE__)))
#else  // defined( gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES ) [default]
#define gsl_CONTRACT_CHECK_(str, x) \
    ((x) ? static_cast<void>(0) : ::gsl::detail::fail_fast_terminate())
#define gsl_FAILFAST_() (::gsl::detail::fail_fast_terminate())
#endif

// Public contract macros.
//
// Each regular check expands to gsl_CONTRACT_CHECK_ with a message naming the
// contract kind, unless checking is switched off globally
// (gsl_CONFIG_CONTRACT_CHECKING_OFF) or for that kind (..._EXPECTS_OFF,
// ..._ENSURES_OFF, ..._ASSERT_OFF), in which case it expands to
// gsl_CONTRACT_UNENFORCED_.
//
// The *Audit variants are enforced only when gsl_CONFIG_CONTRACT_CHECKING_AUDIT
// is defined and the per-kind switch is not off; otherwise they expand to
// gsl_ELIDE_.

// Preconditions. `Expects` is an unprefixed alias for `gsl_Expects`.
#if defined(gsl_CONFIG_CONTRACT_CHECKING_OFF) || defined(gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF)
#define gsl_Expects(x) gsl_CONTRACT_UNENFORCED_(x)
#else
#define gsl_Expects(x) gsl_CONTRACT_CHECK_("GSL: Precondition failure", x)
#endif
#define Expects(x) gsl_Expects(x)
#if !defined(gsl_CONFIG_CONTRACT_CHECKING_AUDIT) || \
        defined(gsl_CONFIG_CONTRACT_CHECKING_EXPECTS_OFF)
#define gsl_ExpectsAudit(x) gsl_ELIDE_(x)
#else
#define gsl_ExpectsAudit(x) gsl_CONTRACT_CHECK_("GSL: Precondition failure (audit)", x)
#endif

// Postconditions. `Ensures` is an unprefixed alias for `gsl_Ensures`.
#if defined(gsl_CONFIG_CONTRACT_CHECKING_OFF) || defined(gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF)
#define gsl_Ensures(x) gsl_CONTRACT_UNENFORCED_(x)
#else
#define gsl_Ensures(x) gsl_CONTRACT_CHECK_("GSL: Postcondition failure", x)
#endif
#define Ensures(x) gsl_Ensures(x)
#if !defined(gsl_CONFIG_CONTRACT_CHECKING_AUDIT) || \
        defined(gsl_CONFIG_CONTRACT_CHECKING_ENSURES_OFF)
#define gsl_EnsuresAudit(x) gsl_ELIDE_(x)
#else
#define gsl_EnsuresAudit(x) gsl_CONTRACT_CHECK_("GSL: Postcondition failure (audit)", x)
#endif

// General assertions. No unprefixed alias is defined for these.
#if defined(gsl_CONFIG_CONTRACT_CHECKING_OFF) || defined(gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF)
#define gsl_Assert(x) gsl_CONTRACT_UNENFORCED_(x)
#else
#define gsl_Assert(x) gsl_CONTRACT_CHECK_("GSL: Assertion failure", x)
#endif
#if !defined(gsl_CONFIG_CONTRACT_CHECKING_AUDIT) || defined(gsl_CONFIG_CONTRACT_CHECKING_ASSERT_OFF)
#define gsl_AssertAudit(x) gsl_ELIDE_(x)
#else
#define gsl_AssertAudit(x) gsl_CONTRACT_CHECK_("GSL: Assertion failure (audit)", x)
#endif

// Unconditional failure; not affected by the checking on/off switches above.
#define gsl_FailFast() gsl_FAILFAST_()

    // Exception carrying a contract-violation message; it is the type thrown by
    // detail::fail_fast_throw() and fail_fast_assert().
    struct fail_fast : std::logic_error {
        explicit fail_fast(char const *message)
                : std::logic_error(message) {
        }
    };

    namespace detail {

#if gsl_HAVE(EXCEPTIONS)
    // Throws fail_fast carrying `message`. Only declared when exceptions are
    // available.
    gsl_NORETURN inline void fail_fast_throw(char const *message) { throw fail_fast(message); }
#endif  // gsl_HAVE( EXCEPTIONS )
    // Ends the program by calling std::terminate().
    gsl_NORETURN inline void fail_fast_terminate() gsl_noexcept { std::terminate(); }

    }  // namespace detail

    // Declared here only; the definition must be supplied by the user. It is
    // called by the contract-checking macros and by fail_fast_assert() when
    // gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER is defined.
    //   expression - text of the failed condition ("" for gsl_FailFast())
    //   message    - description of the kind of contract that failed
    //   file, line - source location of the check
    gsl_api void fail_fast_assert_handler(char const *const expression, char const *const message,
                                          char const *const file, int line);

// Deprecated function-style checks, kept for callers that still use them. The
// signature depends on the configured violation policy, so exactly one of the
// overloads below exists in any given build.
#if defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS)

#if gsl_HAVE(EXCEPTIONS)
    // Throws fail_fast(message) when `cond` is false.
    gsl_DEPRECATED_MSG(
            "don't call gsl::fail_fast_assert() directly; use "
            "contract checking macros instead") gsl_constexpr14 inline void
    fail_fast_assert(bool cond, char const *const message) {
        if (!cond)
            throw fail_fast(message);
    }
#endif  // gsl_HAVE( EXCEPTIONS )

#elif defined(gsl_CONFIG_CONTRACT_VIOLATION_CALLS_HANDLER)

    // Forwards to the user-supplied fail_fast_assert_handler() when `cond` is
    // false.
    gsl_DEPRECATED_MSG(
            "don't call gsl::fail_fast_assert() directly; use "
            "contract checking macros instead") gsl_api gsl_constexpr14 inline void
    fail_fast_assert(bool cond, char const *const expression, char const *const message,
                     char const *const file, int line) {
        if (!cond)
            ::gsl::fail_fast_assert_handler(expression, message, file, line);
    }

#else  // defined( gsl_CONFIG_CONTRACT_VIOLATION_TERMINATES ) [default]

    // Calls std::terminate() when `cond` is false.
    gsl_DEPRECATED_MSG(
            "don't call gsl::fail_fast_assert() directly; use "
            "contract checking macros instead") gsl_constexpr14 inline void
    fail_fast_assert(bool cond) gsl_noexcept {
        if (!cond)
            std::terminate();
    }

#endif

    //
    // GSL.util: utilities
    //

#if gsl_FEATURE(EXPERIMENTAL_RETURN_GUARD)

    // Add uncaught_exceptions for pre-2017 MSVC, GCC and Clang
    // Return unsigned char to save stack space, uncaught_exceptions can only
    // increase by 1 in a scope

    namespace std11 {

#if gsl_HAVE(UNCAUGHT_EXCEPTIONS)

    // The standard library provides std::uncaught_exceptions(): forward to it
    // and narrow the count to unsigned char.
    inline unsigned char uncaught_exceptions() gsl_noexcept {
        return static_cast<unsigned char>(std::uncaught_exceptions());
    }

#else                  // ! gsl_HAVE( UNCAUGHT_EXCEPTIONS )
#if defined(_MSC_VER)  // MS-STL with either MSVC or clang-cl

    // Reads an `unsigned` at a fixed byte offset from the address returned by
    // detail::_getptd(): 0x100 when pointers are 8 bytes wide, 0x90 otherwise.
    // NOTE(review): the offsets are hard-coded runtime-layout details that this
    // file does not explain - confirm against the targeted runtime versions.
    inline unsigned char uncaught_exceptions() gsl_noexcept {
        return static_cast<unsigned char>(*reinterpret_cast<unsigned const *>(
                detail::_getptd() + (sizeof(void *) == 8 ? 0x100 : 0x90)));
    }

#elif gsl_COMPILER_CLANG_VERSION || gsl_COMPILER_GNUC_VERSION || gsl_COMPILER_APPLECLANG_VERSION

    // Reads an `unsigned` located sizeof(void *) bytes past the address returned
    // by detail::__cxa_get_globals().
    // NOTE(review): presumably the uncaught-exception counter that follows a
    // leading pointer member of the ABI's per-thread globals - confirm.
    inline unsigned char uncaught_exceptions() gsl_noexcept {
        return static_cast<unsigned char>((*reinterpret_cast<unsigned const *>(
                reinterpret_cast<unsigned char const *>(detail::__cxa_get_globals()) +
                sizeof(void *))));
    }

#endif
#endif

    }  // namespace std11

#endif  // gsl_FEATURE( EXPERIMENTAL_RETURN_GUARD )

#if gsl_STDLIB_CPP11_110

    gsl_DISABLE_MSVC_WARNINGS(4702)  // unreachable code

            template <class F>
            class final_action {
    public:
        // Stores `action`; the new guard is armed and will run it on destruction.
        explicit final_action(F action) gsl_noexcept : callback_(std::move(action)),
                                                       armed_(true) {}

        // Move construction hands the pending invocation over to the new guard
        // and disarms the source.
        final_action(final_action &&rhs) gsl_noexcept : callback_(std::move(rhs.callback_)),
                                                        armed_(rhs.armed_) {
            rhs.armed_ = false;
        }

        // Runs the stored action unless the guard was moved from or dismissed.
        gsl_SUPPRESS_MSGSL_WARNING(f .6) virtual ~final_action() gsl_noexcept {
            if (!armed_)
                return;
            callback_();
        }

        // Copy construction and both assignments are disabled via gsl_is_delete.
        gsl_is_delete_access : final_action(final_action const &) gsl_is_delete;
        final_action &operator=(final_action const &) gsl_is_delete;
        final_action &operator=(final_action &&) gsl_is_delete;

    protected:
        // Lets derived guards cancel the pending invocation.
        void dismiss() gsl_noexcept { armed_ = false; }

    private:
        F callback_;
        bool armed_;
    };

    // Creates a guard that runs a copy of `action` when the guard is destroyed.
    // This overload is selected for const lvalue callables.
    template <class F>
    gsl_NODISCARD inline final_action<F> finally(F const &action) gsl_noexcept {
        return final_action<F>(action);
    }

    // Creates a guard from a forwarded callable (moved from rvalues, copied
    // from non-const lvalues).
    //
    // For a non-const lvalue argument `F` is deduced as a reference type. The
    // stored type is therefore decayed: a `final_action<X &>` would hold a
    // reference member that its constructor cannot initialise from
    // `std::move(action)`, so such calls previously failed to compile.
    template <class F>
    gsl_NODISCARD inline final_action<typename std::decay<F>::type> finally(F && action)
            gsl_noexcept {
        return final_action<typename std::decay<F>::type>(std::forward<F>(action));
    }

#if gsl_FEATURE(EXPERIMENTAL_RETURN_GUARD)

    // Guard that runs its action only if the number of uncaught exceptions at
    // destruction equals the number recorded when the guard was constructed.
    template <class F>
    class final_action_return : public final_action<F> {
    public:
        // Takes over `action` and records the current uncaught-exception count.
        explicit final_action_return(F &&action) gsl_noexcept
                : final_action<F>(std::move(action)),
                  baseline_(std11::uncaught_exceptions()) {}

        // Takes over the pending action of `rhs`; the count is sampled again at
        // the time of the move rather than copied from `rhs`.
        final_action_return(final_action_return &&rhs) gsl_noexcept
                : final_action<F>(std::move(rhs)),
                  baseline_(std11::uncaught_exceptions()) {}

        // Cancels the action when the exception count has changed; the base
        // class destructor then performs (or skips) the call.
        ~final_action_return() override {
            bool const count_changed = std11::uncaught_exceptions() != baseline_;
            if (count_changed) {
                this->dismiss();
            }
        }

        // Copying is disabled via gsl_is_delete.
        gsl_is_delete_access : final_action_return(final_action_return const &) gsl_is_delete;
        final_action_return &operator=(final_action_return const &) gsl_is_delete;

    private:
        unsigned char baseline_;
    };

    // Creates a final_action_return guard from a const lvalue callable.
    //
    // final_action_return's constructor takes `F &&`, which cannot bind to a
    // const lvalue, so the guard is built from an explicit copy of `action`.
    template <class F>
    gsl_NODISCARD inline final_action_return<F> on_return(F const &action) gsl_noexcept {
        return final_action_return<F>(F(action));
    }

    // Creates a final_action_return guard from a forwarded callable.
    //
    // For a non-const lvalue argument `F` is deduced as a reference type, so
    // the stored type is decayed and the constructor is given a temporary
    // (copied from an lvalue, moved from an rvalue). Without this, lvalue
    // callables did not compile.
    template <class F>
    gsl_NODISCARD inline final_action_return<typename std::decay<F>::type> on_return(F && action)
            gsl_noexcept {
        typedef typename std::decay<F>::type action_type;
        return final_action_return<action_type>(action_type(std::forward<F>(action)));
    }

    // Guard that runs its action only if the number of uncaught exceptions at
    // destruction differs from the number recorded when the guard was
    // constructed.
    template <class F>
    class final_action_error : public final_action<F> {
    public:
        // Takes over `action` and records the current uncaught-exception count.
        explicit final_action_error(F &&action) gsl_noexcept
                : final_action<F>(std::move(action)),
                  baseline_(std11::uncaught_exceptions()) {}

        // Takes over the pending action of `rhs`; the count is sampled again at
        // the time of the move rather than copied from `rhs`.
        final_action_error(final_action_error &&rhs) gsl_noexcept
                : final_action<F>(std::move(rhs)),
                  baseline_(std11::uncaught_exceptions()) {}

        // Cancels the action when the exception count is unchanged; the base
        // class destructor then performs (or skips) the call.
        ~final_action_error() override {
            bool const count_unchanged = std11::uncaught_exceptions() == baseline_;
            if (count_unchanged) {
                this->dismiss();
            }
        }

        // Copying is disabled via gsl_is_delete.
        gsl_is_delete_access : final_action_error(final_action_error const &) gsl_is_delete;
        final_action_error &operator=(final_action_error const &) gsl_is_delete;

    private:
        unsigned char baseline_;
    };

    // Creates a final_action_error guard from a const lvalue callable.
    //
    // final_action_error's constructor takes `F &&`, which cannot bind to a
    // const lvalue, so the guard is built from an explicit copy of `action`.
    template <class F>
    gsl_NODISCARD inline final_action_error<F> on_error(F const &action) gsl_noexcept {
        return final_action_error<F>(F(action));
    }

    // Creates a final_action_error guard from a forwarded callable.
    //
    // For a non-const lvalue argument `F` is deduced as a reference type, so
    // the stored type is decayed and the constructor is given a temporary
    // (copied from an lvalue, moved from an rvalue). Without this, lvalue
    // callables did not compile.
    template <class F>
    gsl_NODISCARD inline final_action_error<typename std::decay<F>::type> on_error(F && action)
            gsl_noexcept {
        typedef typename std::decay<F>::type action_type;
        return final_action_error<action_type>(action_type(std::forward<F>(action)));
    }

#endif  // gsl_FEATURE( EXPERIMENTAL_RETURN_GUARD )

    gsl_RESTORE_MSVC_WARNINGS()
#else  // ! gsl_STDLIB_CPP11_110

    // Pre-C++11 scope guard: calls a plain function pointer on destruction
    // unless the pending call was handed to a copy or dismissed.
    class final_action {
    public:
        typedef void (*Action)();

        // Arms the guard with `action`.
        final_action(Action action) : callback_(action), armed_(true) {}

        // Copying transfers the pending call: the copy inherits the armed state
        // and the source is disarmed (hence the `mutable` flag).
        final_action(final_action const &other)
                : callback_(other.callback_), armed_(other.armed_) {
            other.armed_ = false;
        }

        // Invokes the stored function if the guard is still armed.
        virtual ~final_action() {
            if (!armed_)
                return;
            callback_();
        }

    protected:
        // Lets derived guards cancel the pending call.
        void dismiss() { armed_ = false; }

    private:
        // Assignment is declared but not defined: guards cannot be assigned.
        final_action &operator=(final_action const &);

        Action callback_;
        mutable bool armed_;
    };

    // Wraps `f` in a final_action guard and hands the guard to the caller.
    template <class F>
    inline final_action finally(F const &f) {
        final_action guard(f);
        return guard;
    }

#if gsl_FEATURE(EXPERIMENTAL_RETURN_GUARD)

    class final_action_return : public final_action {
    public:
        explicit final_action_return(Action action)
                : final_action(action), exception_count(std11::uncaught_exceptions()) {}

        ~final_action_return() {
            if (std11::uncaught_exceptions() != exception_count)
                this->dismiss();
        }

    private:
        final_action_return &operator=(final_action_return const &);

    private:
        unsigned char exception_count;
    };

    // Wraps `action` in a final_action_return guard and hands it to the caller.
    template <class F>
    inline final_action_return on_return(F const &action) {
        final_action_return guard(action);
        return guard;
    }

    class final_action_error : public final_action {
    public:
        explicit final_action_error(Action action)
                : final_action(action), exception_count(std11::uncaught_exceptions()) {}

        ~final_action_error() {
            if (std11::uncaught_exceptions() == exception_count)
                this->dismiss();
        }

    private:
        final_action_error &operator=(final_action_error const &);

    private:
        unsigned char exception_count;
    };

    // Wraps `action` in a final_action_error guard and hands it to the caller.
    template <class F>
    inline final_action_error on_error(F const &action) {
        final_action_error guard(action);
        return guard;
    }

#endif  // gsl_FEATURE( EXPERIMENTAL_RETURN_GUARD )

#endif  // gsl_STDLIB_CPP11_110

// narrow_cast<T>(u): a static_cast to T with no checks of any kind; use it to
// mark conversions where losing information is intended. See narrow<>() and
// narrow_failfast<>() for checked conversions.
#if gsl_STDLIB_CPP11_120

            // Forwarding version.
            template <class T, class U>
            gsl_NODISCARD gsl_api inline gsl_constexpr T narrow_cast(U && u) gsl_noexcept {
        return static_cast<T>(std::forward<U>(u));
    }

#else  // ! gsl_STDLIB_CPP11_120

    // By-value version for standard libraries below the gsl_STDLIB_CPP11_120
    // level.
    template <class T, class U>
    gsl_api inline T narrow_cast(U u) gsl_noexcept {
        return static_cast<T>(u);
    }

#endif  // gsl_STDLIB_CPP11_120

    // Exception thrown by narrow<>() when the converted value does not match
    // the original. what() always returns the fixed string "narrowing_error".
    struct narrowing_error : public std::exception {
        char const *what() const gsl_noexcept
#if gsl_HAVE(OVERRIDE_FINAL)
                override
#endif
        {
            return "narrowing_error";
        }
    };

#if gsl_HAVE(TYPE_TRAITS)

    namespace detail {

    // True when T and U are both signed or both unsigned, as reported by
    // std::is_signed.
    template <class T, class U>
    struct is_same_signedness
            : public std::integral_constant<bool,
                                            std::is_signed<T>::value == std::is_signed<U>::value> {
    };

#if gsl_COMPILER_NVCC_VERSION
    // We do this to circumvent NVCC warnings about pointless unsigned comparisons
    // with 0.

    // Signed case: compares against a value-initialised T.
    template <class T>
    gsl_constexpr gsl_api bool is_negative(T value, std::true_type /*isSigned*/) gsl_noexcept {
        return value < T();
    }
    // Unsigned case: never negative, so no comparison is made.
    template <class T>
    gsl_constexpr gsl_api bool is_negative(T /*value*/,
                                           std::false_type /*isUnsigned*/) gsl_noexcept {
        return false;
    }
    // Same signedness: reports true without inspecting the values.
    template <class T, class U>
    gsl_constexpr gsl_api bool have_same_sign(T,
                                              U,
                                              std::true_type /*isSameSignedness*/) gsl_noexcept {
        return true;
    }
    // Differing signedness: the values have the same sign when both or neither
    // are negative.
    template <class T, class U>
    gsl_constexpr gsl_api bool have_same_sign(T t,
                                              U u,
                                              std::false_type /*isSameSignedness*/) gsl_noexcept {
        return detail::is_negative(t, std::is_signed<T>()) ==
               detail::is_negative(u, std::is_signed<U>());
    }
#endif  // gsl_COMPILER_NVCC_VERSION

    }  // namespace detail

#endif

    // narrow<T>(u): converts `u` to T and verifies that no information was lost.
    //
    // Two checks are made: converting the result back to U must reproduce `u`,
    // and the result must not differ from `u` in sign. On failure the function
    // throws narrowing_error when exceptions are available and either
    // gsl_CONFIG(NARROW_THROWS_ON_TRUNCATION) or
    // gsl_CONFIG_CONTRACT_VIOLATION_THROWS is set; otherwise it calls
    // std::terminate(). Returns the converted value.
    template <class T, class U>
    gsl_NODISCARD
#if !gsl_CONFIG(NARROW_THROWS_ON_TRUNCATION) && !defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS)
            gsl_api
#endif
            inline T
            narrow(U u) {
#if gsl_CONFIG(NARROW_THROWS_ON_TRUNCATION) && !gsl_HAVE(EXCEPTIONS)
        // Throwing was requested but exceptions are unavailable: reject any
        // instantiation at compile time.
        gsl_STATIC_ASSERT_(detail::dependent_false<T>::value,
                           "According to the GSL specification, narrow<>() throws an exception of "
                           "type narrowing_error on truncation. Therefore "
                           "it cannot be used if exceptions are disabled. Consider using "
                           "narrow_failfast<>() instead which raises a precondition "
                           "violation if the given value cannot be represented in the target "
                           "type.");
#endif

        T t = static_cast<T>(u);

        // Round-trip check: the value must survive conversion back to U.
        if (static_cast<U>(t) != u) {
#if gsl_HAVE(EXCEPTIONS) && \
        (gsl_CONFIG(NARROW_THROWS_ON_TRUNCATION) || defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS))
            throw narrowing_error();
#else
            std::terminate();
#endif
        }

        // Sign check; the form of the condition depends on what the
        // toolchain provides. Each branch supplies the `if (...)` for the
        // shared block that follows.
#if gsl_HAVE(TYPE_TRAITS)
#if gsl_COMPILER_NVCC_VERSION
        if (!detail::have_same_sign(t, u, detail::is_same_signedness<T, U>()))
#else
        gsl_SUPPRESS_MSVC_WARNING(
                4127,
                "conditional expression is constant") if (!detail::is_same_signedness<T,
                                                                                      U>::value &&
                                                          (t < T()) != (u < U()))
#endif
#else
        // Don't assume T() works:
        gsl_SUPPRESS_MSVC_WARNING(4127,
                                  "conditional expression is constant") if ((t < 0) != (u < 0))
#endif
        {
#if gsl_HAVE(EXCEPTIONS) && \
        (gsl_CONFIG(NARROW_THROWS_ON_TRUNCATION) || defined(gsl_CONFIG_CONTRACT_VIOLATION_THROWS))
            throw narrowing_error();
#else
            std::terminate();
#endif
        }

        return t;
    }

    // narrow_failfast<T>(u): converts `u` to T and reports a lossy conversion
    // as a precondition violation through gsl_Expects, instead of throwing
    // narrowing_error as narrow<>() may do.
    //
    // The same two checks as in narrow<>() are made: the value must round-trip
    // through T, and the result must not differ from `u` in sign. Returns the
    // converted value.
    template <class T, class U>
    gsl_NODISCARD gsl_api inline T narrow_failfast(U u) {
        T t = static_cast<T>(u);

        // Round-trip check.
        gsl_Expects(static_cast<U>(t) == u);

        // Sign check; the form depends on what the toolchain provides.
#if gsl_HAVE(TYPE_TRAITS)
#if gsl_COMPILER_NVCC_VERSION
        gsl_Expects(::gsl::detail::have_same_sign(t, u, ::gsl::detail::is_same_signedness<T, U>()));
#else
        gsl_SUPPRESS_MSVC_WARNING(4127, "conditional expression is constant") gsl_Expects(
                (::gsl::detail::is_same_signedness<T, U>::value || (t < T()) == (u < U())));
#endif
#else
        // Don't assume T() works:
        gsl_SUPPRESS_MSVC_WARNING(4127, "conditional expression is constant")
                gsl_Expects((t < 0) == (u < 0));
#endif

        return t;
    }

    //
    // at() - Bounds-checked way of accessing static arrays, std::array,
    // std::vector.
    //
    // Each overload below that checks bounds does so with gsl_Expects, so an
    // out-of-range `pos` is handled according to the configured
    // contract-violation policy.
    //

    // Built-in arrays: `pos` must be less than the array extent N.
    template <class T, size_t N>
    gsl_NODISCARD gsl_api inline gsl_constexpr14 T &at(T(&arr)[N], size_t pos) {
        gsl_Expects(pos < N);
        return arr[pos];
    }

    // Mutable containers providing size(), operator[] and value_type.
    template <class Container>
    gsl_NODISCARD gsl_api inline gsl_constexpr14 typename Container::value_type &at(
            Container & cont, size_t pos) {
        gsl_Expects(pos < cont.size());
        return cont[pos];
    }

    // Const containers providing size(), operator[] and value_type.
    template <class Container>
    gsl_NODISCARD gsl_api inline gsl_constexpr14 typename Container::value_type const &at(
            Container const &cont, size_t pos) {
        gsl_Expects(pos < cont.size());
        return cont[pos];
    }

#if gsl_HAVE(INITIALIZER_LIST)

    // Initializer lists: returns the element by value.
    template <class T>
    gsl_NODISCARD gsl_api inline const gsl_constexpr14 T at(std::initializer_list<T> cont,
                                                            size_t pos) {
        gsl_Expects(pos < cont.size());
        return *(cont.begin() + pos);
    }
#endif

    // Spans: no check is made here; the access is delegated to
    // span<T>::operator[].
    // NOTE(review): presumably operator[] performs its own bounds check -
    // confirm against the span definition.
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr14 T &at(span<T> s, size_t pos) {
        return s[pos];
    }

    //
    // GSL.views: views
    //

    //
    // not_null<> - Wrap any indirection and enforce non-null.
    //

    template <class T>
    class not_null;

    namespace detail {

// helper class to figure out the pointed-to type of a pointer
// (element_type_helper<T>::type is used by not_null<T> as its element_type)
#if gsl_STDLIB_CPP11_OR_GREATER
    // Primary template: derives the type from the result of dereferencing a T.
    template <class T, class E = void>
    struct element_type_helper {
        // For types without a member element_type (this will handle raw pointers)
        typedef typename std::remove_reference<decltype(*std::declval<T>())>::type type;
    };

    // Chosen when T::element_type names a type.
    template <class T>
    struct element_type_helper<T, std17::void_t<typename T::element_type>> {
        // For types with a member element_type
        typedef typename T::element_type type;
    };
#else   // ! gsl_STDLIB_CPP11_OR_GREATER
    // Pre-C++11, we cannot have decltype, so we cannot handle types without a
    // member element_type
    template <class T, class E = void>
    struct element_type_helper {
        typedef typename T::element_type type;
    };

    // Raw pointers are handled by an explicit partial specialization instead.
    template <class T>
    struct element_type_helper<T *> {
        typedef T type;
    };
#endif  // gsl_STDLIB_CPP11_OR_GREATER

    // Trait that is true for any not_null<T> specialization and for bool, and
    // false for every other type.
    template <class T>
    struct is_not_null_or_bool_oracle : std11::false_type {};
    template <class T>
    struct is_not_null_or_bool_oracle<not_null<T>> : std11::true_type {};
    template <>
    struct is_not_null_or_bool_oracle<bool> : std11::true_type {};

    // Storage for not_null<T>: holds the wrapped pointer `ptr_` and defines
    // which copy/move operations exist. not_null<T> selects the specialization
    // with IsCopyable = is_copyable<T>::value.
    template <class T, bool IsCopyable = true>
    struct not_null_data;
#if gsl_HAVE(MOVE_FORWARD)
    // Move-only pointer types: move construction and move assignment only;
    // copying is disabled via gsl_is_delete.
    template <class T>
    struct not_null_data<T, false> {
        T ptr_;

        gsl_api gsl_constexpr14 not_null_data(T &&_ptr) gsl_noexcept : ptr_(std::move(_ptr)) {}

        gsl_api gsl_constexpr14 not_null_data(not_null_data &&other) gsl_noexcept
                : ptr_(std::move(other.ptr_)) {}
        gsl_api gsl_constexpr14 not_null_data &operator=(not_null_data &&other) gsl_noexcept {
            ptr_ = std::move(other.ptr_);
            return *this;
        }

        gsl_is_delete_access : not_null_data(not_null_data const &) gsl_is_delete;
        not_null_data &operator=(not_null_data const &) gsl_is_delete;
    };
#if gsl_CONFIG_DEFAULTS_VERSION >= 1
#endif  // gsl_CONFIG_DEFAULTS_VERSION >= 1
#endif  // gsl_HAVE( MOVE_FORWARD )
    // Copyable pointer types.
    template <class T>
    struct not_null_data<T, true> {
        T ptr_;

        gsl_api gsl_constexpr14 not_null_data(T const &_ptr) gsl_noexcept : ptr_(_ptr) {}

#if gsl_HAVE(MOVE_FORWARD)
        gsl_api gsl_constexpr14 not_null_data(T &&_ptr) gsl_noexcept : ptr_(std::move(_ptr)) {}

        gsl_api gsl_constexpr14 not_null_data(not_null_data &&other) gsl_noexcept
                : ptr_(std::move(other.ptr_)) {}
        gsl_api gsl_constexpr14 not_null_data &operator=(not_null_data &&other) gsl_noexcept {
            ptr_ = std::move(other.ptr_);
            return *this;
        }
#endif  // gsl_HAVE( MOVE_FORWARD )

        // Copying checks that the source pointer is non-null (after the copy in
        // the constructor, before the assignment in operator=). The move
        // operations above carry no such check.
        gsl_api gsl_constexpr14 not_null_data(not_null_data const &other) : ptr_(other.ptr_) {
            gsl_Expects(ptr_ != gsl_nullptr);
        }
        gsl_api gsl_constexpr14 not_null_data &operator=(not_null_data const &other) {
            gsl_Expects(other.ptr_ != gsl_nullptr);
            ptr_ = other.ptr_;
            return *this;
        }
    };
#if gsl_CONFIG_DEFAULTS_VERSION >= 1
    // Raw pointers: only a converting constructor is declared, so copy and move
    // use the implicitly generated operations and perform no null check.
    template <class T>
    struct not_null_data<T *, true> {
        T *ptr_;

        gsl_api gsl_constexpr14 not_null_data(T *_ptr) gsl_noexcept : ptr_(_ptr) {}
    };
#endif  // gsl_CONFIG_DEFAULTS_VERSION >= 1
    // Trait telling whether T is both copy-constructible and copy-assignable.
    // Without <type_traits> support every type is reported as copyable.
    template <class T>
    struct is_copyable
#if gsl_HAVE(TYPE_TRAITS)
            : std11::integral_constant<bool,
                                       std::is_copy_constructible<T>::value &&
                                               std::is_copy_assignable<T>::value>
#else
            : std11::true_type
#endif
    {
    };
#if gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(UNIQUE_PTR) && gsl_BETWEEN(gsl_COMPILER_MSVC_VERSION, 1, 140)
    // Type traits are buggy in VC++ 2013, so we explicitly declare `unique_ptr<>`
    // non-copyable.
    template <class T, class Deleter>
    struct is_copyable<std::unique_ptr<T, Deleter>> : std11::false_type {};
#endif

    template <class T>
    struct not_null_accessor;

    }  // namespace detail

    template <class T>
    class not_null {
    private:
        detail::not_null_data<T, detail::is_copyable<T>::value> data_;

        // need to access `not_null<U>::data_`
        template <class U>
        friend class not_null;

        template <class U>
        friend struct detail::not_null_accessor;

    public:
        typedef typename detail::element_type_helper<T>::type element_type;

#if gsl_HAVE(TYPE_TRAITS)
        static_assert(
                std::is_assignable<
                        typename std::remove_const<typename std::remove_reference<T>::type>::type &,
                        std::nullptr_t>::value,
                "T cannot be assigned nullptr.");
#endif

#if gsl_CONFIG(NOT_NULL_EXPLICIT_CTOR)
#if gsl_HAVE(MOVE_FORWARD)
        template <class U
        // In Clang 3.x, `is_constructible<not_null<unique_ptr<X>>, unique_ptr<X>>`
        // tries to instantiate the copy constructor of `unique_ptr<>`, triggering
        // an error. Note that Apple Clang's `__clang_major__` etc. are different
        // from regular Clang.
#if gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) && \
        !gsl_BETWEEN(gsl_COMPILER_CLANG_VERSION, 1, 400) &&             \
        !gsl_BETWEEN(gsl_COMPILER_APPLECLANG_VERSION, 1, 1001)
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the
                  // overload is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<T, U>::value), int>::type = 0
#endif
                  >
        gsl_api gsl_constexpr14 explicit not_null(U other) : data_(T(std::move(other))) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
#else   // a.k.a. ! gsl_HAVE( MOVE_FORWARD )
        template <class U>
        gsl_api gsl_constexpr14 explicit not_null(U const &other) : data_(T(other)) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
#endif  // gsl_HAVE( MOVE_FORWARD )
#else   // a.k.a. !gsl_CONFIG( NOT_NULL_EXPLICIT_CTOR )
#if gsl_HAVE(MOVE_FORWARD)
        // In Clang 3.x, `is_constructible<not_null<unique_ptr<X>>, unique_ptr<X>>`
        // tries to instantiate the copy constructor of `unique_ptr<>`, triggering
        // an error. Note that Apple Clang's `__clang_major__` etc. are different
        // from regular Clang.
#if gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) && \
        !gsl_BETWEEN(gsl_COMPILER_CLANG_VERSION, 1, 400) &&             \
        !gsl_BETWEEN(gsl_COMPILER_APPLECLANG_VERSION, 1, 1001)
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the
                  // overload is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<T, U>::value &&
                                           !std::is_convertible<U, T>::value),
                                          int>::type = 0>
        gsl_api gsl_constexpr14 explicit not_null(U other) : data_(T(std::move(other))) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }

        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the
                  // overload is ambiguous.
                  ,
                  typename std::enable_if<(std::is_convertible<U, T>::value), int>::type = 0>
        gsl_api gsl_constexpr14 not_null(U other) : data_(std::move(other)) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
#else   // a.k.a. !( gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE(         \
        // DEFAULT_FUNCTION_TEMPLATE_ARG ) && ! gsl_BETWEEN(      \
        // gsl_COMPILER_CLANG_VERSION, 1, 400 ) && ! gsl_BETWEEN( \
        // gsl_COMPILER_APPLECLANG_VERSION, 1, 1001 )                  \
        // If type_traits are not available, then we can't distinguish               \
        // `is_convertible<>` and `is_constructible<>`, so we unconditionally permit \
        // implicit construction.
        template <class U>
        gsl_api gsl_constexpr14 not_null(U other) : data_(T(std::move(other))) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
#endif  // gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE( DEFAULT_FUNCTION_TEMPLATE_ARG ) \
        // && ! gsl_BETWEEN( gsl_COMPILER_CLANG_VERSION, 1, 400 ) && !          \
        // gsl_BETWEEN( gsl_COMPILER_APPLECLANG_VERSION, 1, 1001 )
#else   // a.k.a. ! gsl_HAVE( MOVE_FORWARD )
        template <class U>
        gsl_api gsl_constexpr14 not_null(U const &other) : data_(T(other)) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
#endif  // gsl_HAVE( MOVE_FORWARD )
#endif  // gsl_CONFIG( NOT_NULL_EXPLICIT_CTOR )

    public:
#if gsl_HAVE(MOVE_FORWARD)
        // In Clang 3.x, `is_constructible<not_null<unique_ptr<X>>, unique_ptr<X>>`
        // tries to instantiate the copy constructor of `unique_ptr<>`, triggering
        // an error. Note that Apple Clang's `__clang_major__` etc. are different
        // from regular Clang.
#if gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) && \
        !gsl_BETWEEN(gsl_COMPILER_CLANG_VERSION, 1, 400) &&             \
        !gsl_BETWEEN(gsl_COMPILER_APPLECLANG_VERSION, 1, 1001)
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the
                  // overload is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<T, U>::value &&
                                           !std::is_convertible<U, T>::value),
                                          int>::type = 0>
        gsl_api gsl_constexpr14 explicit not_null(not_null<U> other)
                : data_(T(std::move(other.data_.ptr_))) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }

        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the
                  // overload is ambiguous.
                  ,
                  typename std::enable_if<(std::is_convertible<U, T>::value), int>::type = 0>
        gsl_api gsl_constexpr14 not_null(not_null<U> other)
                : data_(T(std::move(other.data_.ptr_))) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
#else   // a.k.a. ! ( gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE(        \
        // DEFAULT_FUNCTION_TEMPLATE_ARG ) && ! gsl_BETWEEN(      \
        // gsl_COMPILER_CLANG_VERSION, 1, 400 ) && ! gsl_BETWEEN( \
        // gsl_COMPILER_APPLECLANG_VERSION, 1, 1001 )                  \
        // If type_traits are not available, then we can't distinguish               \
        // `is_convertible<>` and `is_constructible<>`, so we unconditionally permit \
        // implicit construction.
        template <class U>
        gsl_api gsl_constexpr14 not_null(not_null<U> other)
                : data_(T(std::move(other.data_.ptr_))) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
        template <class U>
        gsl_api gsl_constexpr14 not_null<T> &operator=(not_null<U> other) {
            gsl_Expects(other.data_.ptr_ != gsl_nullptr);
            data_.ptr_ = std::move(other.data_.ptr_);
            return *this;
        }
#endif  // gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE( DEFAULT_FUNCTION_TEMPLATE_ARG ) \
        // && ! gsl_BETWEEN( gsl_COMPILER_CLANG_VERSION, 1, 400 ) && !          \
        // gsl_BETWEEN( gsl_COMPILER_APPLECLANG_VERSION, 1, 1001 )
#else   // a.k.a. ! gsl_HAVE( MOVE_FORWARD )
        template <class U>
        gsl_api gsl_constexpr14 not_null(not_null<U> const &other) : data_(T(other.data_.ptr_)) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
        template <class U>
        gsl_api gsl_constexpr14 not_null<T> &operator=(not_null<U> const &other) {
            gsl_Expects(other.data_.ptr_ != gsl_nullptr);
            data_.ptr_ = other.data_.ptr_;
            return *this;
        }
#endif  // gsl_HAVE( MOVE_FORWARD )

#if gsl_CONFIG(TRANSPARENT_NOT_NULL)
        // Transparent configuration: forwards to the stored pointer's own `get()`
        // and returns the resulting raw `element_type *` after a contract check.
        gsl_NODISCARD gsl_api gsl_constexpr14 element_type *get() const {
            element_type *result = data_.ptr_.get();
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#else
#if gsl_CONFIG(NOT_NULL_GET_BY_CONST_REF)
        // Returns the stored pointer by const reference (no copy of `T` is made)
        // after a contract check.
        gsl_NODISCARD gsl_api gsl_constexpr14 T const &get() const {
            T const &result = data_.ptr_;
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#else
        // Returns a copy of the stored pointer after a contract check.
        gsl_NODISCARD gsl_api gsl_constexpr14 T get() const {
            T result = data_.ptr_;
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#endif
#endif

        // We want an implicit conversion operator that can be used to convert from
        // both lvalues (by const reference or by copy) and rvalues (by move). So it
        // seems like we could define
        //
        //     template< class U >
        //     operator U const &() const & { ... }
        //     template< class U >
        //     operator U &&() && { ... }
        //
        // However, having two conversion operators with different return types
        // renders the assignment operator of the result type ambiguous:
        //
        //     not_null<std::unique_ptr<T>> p( ... );
        //     std::unique_ptr<U> q;
        //     q = std::move( p ); // ambiguous
        //
        // To avoid this ambiguity, we have both overloads of the conversion
        // operator return `U` rather than `U const &` or `U &&`. This implies that
        // converting an lvalue always induces a copy, which can cause unnecessary
        // copies or even fail to compile in some situations:
        //
        //     not_null<std::shared_ptr<T>> sp( ... );
        //     std::shared_ptr<U> const & rs = sp; // unnecessary copy
        //     std::unique_ptr<U> const & ru = p; // error: cannot copy
        //     `unique_ptr<T>`
        //
        // However, these situations are rather unusual, and the following, more
        // frequent situations remain unimpaired:
        //
        //     std::shared_ptr<U> vs = sp; // no extra copy
        //     std::unique_ptr<U> vu = std::move( p );

#if gsl_HAVE(MOVE_FORWARD) && gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) && \
        gsl_HAVE(EXPLICIT)
        // explicit conversion operator

        // Explicit conversion to `U` for lvalue (or, without ref-qualifier support,
        // any) `not_null`. Enabled when `U` is constructible from `T const &`, `T`
        // is NOT implicitly convertible to `U`, and
        // `detail::is_not_null_or_bool_oracle<U>` is false.
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the overload
                  // is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<U, T const &>::value &&
                                           !std::is_convertible<T, U>::value &&
                                           !detail::is_not_null_or_bool_oracle<U>::value),
                                          int>::type = 0>
        gsl_NODISCARD gsl_api gsl_constexpr14 explicit operator U() const
#if gsl_HAVE(FUNCTION_REF_QUALIFIER)
                &
#endif
        {
            // Direct-initialize the target from the stored pointer (left intact),
            // then check the converted value before handing it out.
            U result(data_.ptr_);
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#if gsl_HAVE(FUNCTION_REF_QUALIFIER)
        // Explicit conversion to `U` for rvalue `not_null`. Enabled when `U` is
        // constructible from `T`, `T` is NOT implicitly convertible to `U`, and
        // `detail::is_not_null_or_bool_oracle<U>` is false.
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the overload
                  // is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<U, T>::value &&
                                           !std::is_convertible<T, U>::value &&
                                           !detail::is_not_null_or_bool_oracle<U>::value),
                                          int>::type = 0>
        gsl_NODISCARD gsl_api gsl_constexpr14 explicit operator U() && {
            // Moves the stored pointer into the target; this object's pointer is
            // left in its moved-from state.
            U result(std::move(data_.ptr_));
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#endif

        // implicit conversion operator
        // Implicit conversion to `U` for lvalue (or, without ref-qualifier support,
        // any) `not_null`. Enabled when `U` is constructible from `T const &`, `T`
        // IS implicitly convertible to `U`, and
        // `detail::is_not_null_or_bool_oracle<U>` is false.
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the overload
                  // is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<U, T const &>::value &&
                                           std::is_convertible<T, U>::value &&
                                           !detail::is_not_null_or_bool_oracle<U>::value),
                                          int>::type = 0>
        gsl_NODISCARD gsl_api gsl_constexpr14 operator U() const
#if gsl_HAVE(FUNCTION_REF_QUALIFIER)
                &
#endif
        {
            // Direct-initialize the target from the stored pointer (left intact),
            // then check the converted value before handing it out.
            U result(data_.ptr_);
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#if gsl_HAVE(FUNCTION_REF_QUALIFIER)
        // Implicit conversion to `U` for rvalue `not_null`. Enabled when `T` is
        // implicitly convertible to `U` and
        // `detail::is_not_null_or_bool_oracle<U>` is false.
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the overload
                  // is ambiguous.
                  ,
                  typename std::enable_if<(std::is_convertible<T, U>::value &&
                                           !detail::is_not_null_or_bool_oracle<U>::value),
                                          int>::type = 0>
        gsl_NODISCARD gsl_api gsl_constexpr14 operator U() && {
            // Moves the stored pointer into the target; this object's pointer is
            // left in its moved-from state.
            U result(std::move(data_.ptr_));
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#endif
#else   // a.k.a. #if !( gsl_HAVE( MOVE_FORWARD ) && gsl_HAVE( TYPE_TRAITS ) && \
        // gsl_HAVE( DEFAULT_FUNCTION_TEMPLATE_ARG ) && gsl_HAVE( EXPLICIT ) )
        // Unconstrained fallback conversion, used when the feature set required for
        // the SFINAE-constrained operators is unavailable: direct-initializes `U`
        // from the stored pointer and checks the result.
        template <class U>
        gsl_NODISCARD gsl_api gsl_constexpr14 operator U() const {
            U result(data_.ptr_);
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }
#endif  // gsl_HAVE( MOVE_FORWARD ) && gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE( \
        // DEFAULT_FUNCTION_TEMPLATE_ARG ) && gsl_HAVE( EXPLICIT )

        // Member access: returns the stored pointer itself by const reference
        // (not a raw pointer) after a contract check. The free comparison and
        // stream operators of `not_null` call this to reach the stored pointer.
        gsl_NODISCARD gsl_api gsl_constexpr14 T const &operator->() const {
            T const &result(data_.ptr_);
            gsl_Ensures(result != gsl_nullptr);
            return result;
        }

        // Dereference: checks the stored pointer, then returns a reference to the
        // pointee obtained by dereferencing it.
        gsl_NODISCARD gsl_api gsl_constexpr14 element_type &operator*() const {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
            return *data_.ptr_;
        }

#if gsl_HAVE(MOVE_FORWARD)
        // Visual C++ 2013 doesn't generate default move constructors, so we declare
        // them explicitly.
        // Move constructor: takes over `other`'s data and then checks that the
        // pointer now held is non-null (i.e. that `other` had not already been
        // moved from).
        gsl_api gsl_constexpr14 not_null(not_null &&other)
                gsl_noexcept_not_testing  // we want to be nothrow-movable despite the
                                          // precondition check
                : data_(std::move(other.data_)) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
        // Move assignment: requires `other` to hold a non-null pointer, except for
        // self-assignment, which is exempt from the check. Returns `*this`.
        gsl_api gsl_constexpr14 not_null &operator=(not_null &&other)
                gsl_noexcept_not_testing  // we want to be nothrow-movable despite the
                                          // precondition check
        {
            gsl_Expects(other.data_.ptr_ != gsl_nullptr || &other == this);
            data_ = std::move(other.data_);
            return *this;
        }
#endif  // gsl_HAVE( MOVE_FORWARD )

#if gsl_HAVE(IS_DEFAULT)
        // Copy construction and copy assignment are explicitly defaulted (no
        // contract check is performed on copy).
        gsl_constexpr14 not_null(not_null const &) = default;
        gsl_constexpr14 not_null &operator=(not_null const &) = default;
#endif

        // Friend `swap`: requires both operands to hold non-null pointers, then
        // swaps the stored pointers. `using std::swap` plus the unqualified call
        // lets a `swap` overload for `T` found by ADL take precedence.
        gsl_api gsl_constexpr20 friend void swap(not_null &lhs, not_null &rhs)
                gsl_noexcept_not_testing  // we want to be nothrow-swappable despite the
                                          // precondition check
        {
            gsl_Expects(lhs.data_.ptr_ != gsl_nullptr && rhs.data_.ptr_ != gsl_nullptr);
            using std::swap;
            swap(lhs.data_.ptr_, rhs.data_.ptr_);
        }

        // Operations that must not be usable on a `not_null`. Everything below is
        // declared with `gsl_is_delete`.
        // NOTE(review): `gsl_is_delete_access` presumably expands to the access
        // specifier appropriate for how `gsl_is_delete` is implemented -- confirm
        // against the macro definitions.

        // No default construction: there is no valid "empty" state.
        gsl_is_delete_access : not_null() gsl_is_delete;
        // prevent compilation when initialized with a nullptr or literal 0:
#if gsl_HAVE(NULLPTR)
        not_null(std::nullptr_t) gsl_is_delete;
        not_null &operator=(std::nullptr_t) gsl_is_delete;
#else
        not_null(int) gsl_is_delete;
        not_null &operator=(int) gsl_is_delete;
#endif

        // unwanted operators...pointers only point to single objects!
        not_null &operator++() gsl_is_delete;
        not_null &operator--() gsl_is_delete;
        not_null operator++(int) gsl_is_delete;
        not_null operator--(int) gsl_is_delete;
        not_null &operator+(size_t) gsl_is_delete;
        not_null &operator+=(size_t) gsl_is_delete;
        not_null &operator-(size_t) gsl_is_delete;
        not_null &operator-=(size_t) gsl_is_delete;
        not_null &operator+=(std::ptrdiff_t) gsl_is_delete;
        not_null &operator-=(std::ptrdiff_t) gsl_is_delete;
        void operator[](std::ptrdiff_t) const gsl_is_delete;
    };
#if gsl_CONFIG_DEFAULTS_VERSION >= 1
    // Partial specialization of `not_null<>` for raw pointers `T *`.
    //
    // Non-nullness is checked with `gsl_Expects` in the constructors and in the
    // converting assignment operators. The accessors (`get()`, `operator->()`,
    // `operator*()` and the conversion operators) return the stored pointer
    // without re-checking it.
    template <class T>
    class not_null<T *> {
    private:
        // Storage for the wrapped raw pointer; accessed as `data_.ptr_`.
        detail::not_null_data<T *, true> data_;

        // need to access `not_null<U>::data_`
        template <class U>
        friend class not_null;

        // Grants `detail::not_null_accessor` direct access to `data_`.
        template <class U>
        friend struct detail::not_null_accessor;

    public:
        typedef T element_type;

        // Construct from a raw pointer; explicit only when
        // `gsl_CONFIG(NOT_NULL_EXPLICIT_CTOR)` is set. Checks that `other` is
        // non-null.
        gsl_api gsl_constexpr14
#if gsl_CONFIG(NOT_NULL_EXPLICIT_CTOR)
                explicit
#endif  // gsl_CONFIG( NOT_NULL_EXPLICIT_CTOR )
                not_null(T *other)
                : data_(other) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }

#if gsl_HAVE(MOVE_FORWARD)
        // In Clang 3.x, `is_constructible<not_null<unique_ptr<X>>, unique_ptr<X>>`
        // tries to instantiate the copy constructor of `unique_ptr<>`, triggering
        // an error. Note that Apple Clang's `__clang_major__` etc. are different
        // from regular Clang.
#if gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) && \
        !gsl_BETWEEN(gsl_COMPILER_CLANG_VERSION, 1, 400) &&             \
        !gsl_BETWEEN(gsl_COMPILER_APPLECLANG_VERSION, 1, 1001)
        // Explicit converting constructor: `T *` is constructible from `U` but `U`
        // is not implicitly convertible to `T *`, so a `static_cast` is used.
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the
                  // overload is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<T *, U>::value &&
                                           !std::is_convertible<U, T *>::value),
                                          int>::type = 0>
        gsl_api gsl_constexpr14 explicit not_null(not_null<U> other)
                : data_(static_cast<T *>(std::move(other.data_.ptr_))) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }

        // Implicit converting constructor: `U` is implicitly convertible to `T *`.
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the
                  // overload is ambiguous.
                  ,
                  typename std::enable_if<(std::is_convertible<U, T *>::value), int>::type = 0>
        gsl_api gsl_constexpr14 not_null(not_null<U> other) : data_(std::move(other.data_.ptr_)) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
#else   // a.k.a. ! ( gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE(        \
        // DEFAULT_FUNCTION_TEMPLATE_ARG ) && ! gsl_BETWEEN(      \
        // gsl_COMPILER_CLANG_VERSION, 1, 400 ) && ! gsl_BETWEEN( \
        // gsl_COMPILER_APPLECLANG_VERSION, 1, 1001 )                  \
        // If type_traits are not available, then we can't distinguish               \
        // `is_convertible<>` and `is_constructible<>`, so we unconditionally permit \
        // implicit construction.
        template <class U>
        gsl_api gsl_constexpr14 not_null(not_null<U> other) : data_(std::move(other.data_.ptr_)) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
        // Converting assignment: checks the source pointer, then stores it.
        template <class U>
        gsl_api gsl_constexpr14 not_null<T *> &operator=(not_null<U> other) {
            gsl_Expects(other.data_.ptr_ != gsl_nullptr);
            data_.ptr_ = std::move(other.data_.ptr_);
            return *this;
        }
#endif  // gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE( DEFAULT_FUNCTION_TEMPLATE_ARG ) \
        // && ! gsl_BETWEEN( gsl_COMPILER_CLANG_VERSION, 1, 400 ) && !          \
        // gsl_BETWEEN( gsl_COMPILER_APPLECLANG_VERSION, 1, 1001 )
#else   // a.k.a. ! gsl_HAVE( MOVE_FORWARD )
        // Copy-based converting constructor and assignment for compilers without
        // move semantics.
        template <class U>
        gsl_api gsl_constexpr14 not_null(not_null<U> const &other) : data_(other.data_.ptr_) {
            gsl_Expects(data_.ptr_ != gsl_nullptr);
        }
        template <class U>
        gsl_api gsl_constexpr14 not_null<T *> &operator=(not_null<U> const &other) {
            gsl_Expects(other.data_.ptr_ != gsl_nullptr);
            data_.ptr_ = other.data_.ptr_;
            return *this;
        }
#endif  // gsl_HAVE( MOVE_FORWARD )

#if !gsl_CONFIG(TRANSPARENT_NOT_NULL)
        // Returns the stored raw pointer; not declared in the transparent
        // configuration.
        gsl_NODISCARD gsl_api gsl_constexpr14 T *get() const { return data_.ptr_; }
#endif

#if gsl_HAVE(TYPE_TRAITS) && gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) && gsl_HAVE(EXPLICIT)
        // explicit conversion operator
        // (chosen when `U` is constructible from `T *` but `T *` does not convert
        // to `U` implicitly)
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the overload
                  // is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<U, T *>::value &&
                                           !std::is_convertible<T *, U>::value &&
                                           !detail::is_not_null_or_bool_oracle<U>::value),
                                          int>::type = 0>
        gsl_NODISCARD gsl_api gsl_constexpr14 explicit operator U() const {
            return U(data_.ptr_);
        }

        // implicit conversion operator
        // (chosen when `T *` converts to `U` implicitly)
        template <class U
                  // We *have* to use SFINAE with an NTTP arg here, otherwise the overload
                  // is ambiguous.
                  ,
                  typename std::enable_if<(std::is_constructible<U, T *>::value &&
                                           std::is_convertible<T *, U>::value &&
                                           !detail::is_not_null_or_bool_oracle<U>::value),
                                          int>::type = 0>
        gsl_NODISCARD gsl_api gsl_constexpr14 operator U() const {
            return data_.ptr_;
        }
#else   // a.k.a. #if !( gsl_HAVE( TYPE_TRAITS ) && \
        // gsl_HAVE( DEFAULT_FUNCTION_TEMPLATE_ARG ) && gsl_HAVE( EXPLICIT ) )
        // Unconstrained fallback conversion operator.
        template <class U>
        gsl_NODISCARD gsl_api gsl_constexpr14 operator U() const {
            return data_.ptr_;
        }
#endif  // gsl_HAVE( TYPE_TRAITS ) && gsl_HAVE( \
        // DEFAULT_FUNCTION_TEMPLATE_ARG ) && gsl_HAVE( EXPLICIT )

        // Member access through the stored raw pointer (no contract check).
        gsl_NODISCARD gsl_api gsl_constexpr14 T *operator->() const { return data_.ptr_; }

        // Dereferences the stored raw pointer (no contract check).
        gsl_NODISCARD gsl_api gsl_constexpr14 element_type &operator*() const {
            return *data_.ptr_;
        }

#if gsl_HAVE(IS_DEFAULT)
        // Copy operations are explicitly defaulted.
        gsl_constexpr14 not_null(not_null const &) = default;
        gsl_constexpr14 not_null &operator=(not_null const &) = default;
#endif

        // Friend `swap`: exchanges the stored raw pointers; unlike the generic
        // `not_null<T>` version it performs no precondition check.
        gsl_api gsl_constexpr20 friend void swap(not_null &lhs, not_null &rhs) gsl_noexcept {
            using std::swap;
            swap(lhs.data_.ptr_, rhs.data_.ptr_);
        }

        // Everything below is declared with `gsl_is_delete` and must not be usable.
        gsl_is_delete_access : not_null() gsl_is_delete;
        // prevent compilation when initialized with a nullptr or literal 0:
#if gsl_HAVE(NULLPTR)
        not_null(std::nullptr_t) gsl_is_delete;
        not_null &operator=(std::nullptr_t) gsl_is_delete;
#else
        not_null(int) gsl_is_delete;
        not_null &operator=(int) gsl_is_delete;
#endif

        // unwanted operators...pointers only point to single objects!
        not_null &operator++() gsl_is_delete;
        not_null &operator--() gsl_is_delete;
        not_null operator++(int) gsl_is_delete;
        not_null operator--(int) gsl_is_delete;
        not_null &operator+(size_t) gsl_is_delete;
        not_null &operator+=(size_t) gsl_is_delete;
        not_null &operator-(size_t) gsl_is_delete;
        not_null &operator-=(size_t) gsl_is_delete;
        not_null &operator+=(std::ptrdiff_t) gsl_is_delete;
        not_null &operator-=(std::ptrdiff_t) gsl_is_delete;
        void operator[](std::ptrdiff_t) const gsl_is_delete;
    };
#endif  // gsl_CONFIG_DEFAULTS_VERSION >= 1
#if gsl_HAVE(DEDUCTION_GUIDES)
    // Class template argument deduction guides:
    //  - `not_null(U)` deduces `not_null<U>`;
    //  - `not_null(not_null<U>)` also deduces `not_null<U>`, so wrapping an
    //    existing `not_null` does not nest.
    template <class U>
    not_null(U) -> not_null<U>;
    template <class U>
    not_null(not_null<U>) -> not_null<U>;
#endif

#if gsl_HAVE(NULLPTR)
    // Calling `make_not_null(nullptr)` is rejected: this overload is declared
    // with `gsl_is_delete`.
    void make_not_null(std::nullptr_t) gsl_is_delete;
#endif  // gsl_HAVE( NULLPTR )
#if gsl_HAVE(MOVE_FORWARD)
    // Wraps `u` in a `not_null<U>`; the argument is taken by value and moved
    // into the wrapper.
    template <class U>
    gsl_NODISCARD gsl_api gsl_constexpr14 not_null<U> make_not_null(U u) {
        return not_null<U>(std::move(u));
    }
    // An argument that is already a `not_null<U>` is passed through unchanged
    // rather than being wrapped a second time.
    template <class U>
    gsl_NODISCARD gsl_api gsl_constexpr14 not_null<U> make_not_null(not_null<U> u) {
        return std::move(u);
    }
#else   // a.k.a. ! gsl_HAVE( MOVE_FORWARD )
    // Copy-based equivalents for compilers without move semantics.
    template <class U>
    gsl_NODISCARD gsl_api not_null<U> make_not_null(U const &u) {
        return not_null<U>(u);
    }
    template <class U>
    gsl_NODISCARD gsl_api not_null<U> make_not_null(not_null<U> const &u) {
        return u;
    }
#endif  // gsl_HAVE( MOVE_FORWARD )

    namespace detail {

    // Trait used in the return type of the generic `as_nullable()` overload:
    // the primary template exposes `type = T`, while the `not_null<T>`
    // specialization deliberately has no `type` member, so a return type built
    // on it fails substitution for `not_null` arguments.
    template <class T>
    struct as_nullable_helper {
        typedef T type;
    };
    template <class T>
    struct as_nullable_helper<not_null<T>> {};

    // Accessor that reads `not_null<T>::data_.ptr_` directly, without any
    // contract check. `not_null<T *>` declares this struct a friend; the
    // primary template's friend declarations are not visible here.
    template <class T>
    struct not_null_accessor {
#if gsl_HAVE(MOVE_FORWARD)
        // Rvalue overload: moves the stored pointer out of `p`.
        static gsl_api T get(not_null<T> &&p) gsl_noexcept { return std::move(p.data_.ptr_); }
#endif
        // Lvalue overload: returns a const reference to the stored pointer.
        static gsl_api T const &get(not_null<T> const &p) gsl_noexcept { return p.data_.ptr_; }
    };

    namespace no_adl {

#if gsl_HAVE(MOVE_FORWARD)
    // Pass-through overload for arguments that are NOT `not_null<>` (for
    // `not_null<>` the return type has no `type` member, which removes this
    // overload from consideration). Returns the argument by value.
    //
    // `p` is a forwarding reference, so it must be forwarded rather than
    // unconditionally moved: with `std::move`, passing an lvalue (e.g. a
    // `std::shared_ptr`) would silently move from the caller's object and leave
    // it empty. With `std::forward`, lvalues are copied and only rvalues are
    // moved from. Passing an lvalue of a move-only type is now a compile error
    // instead of a silent steal; use `std::move()` at the call site to opt in.
    //
    // The `noexcept` condition describes the construction actually performed
    // (result type constructed from `T`, i.e. a copy for lvalues and a move for
    // rvalues). The extra parentheses keep the comma out of the macro argument
    // list.
    template <class T>
    gsl_NODISCARD gsl_api gsl_constexpr auto as_nullable(T &&p) gsl_noexcept_if(
            (std::is_nothrow_constructible<typename std20::remove_cvref<T>::type, T>::value)) ->
            typename detail::as_nullable_helper<typename std20::remove_cvref<T>::type>::type {
        return std::forward<T>(p);
    }
    // Rvalue `not_null<T>`: moves the wrapped pointer out through
    // `not_null_accessor` and checks that it is non-null (it would be null if
    // `p` had already been moved from).
    template <class T>
    gsl_NODISCARD gsl_api gsl_constexpr14 T as_nullable(not_null<T> &&p) {
        T result = detail::not_null_accessor<T>::get(std::move(p));
        gsl_Expects(result != gsl_nullptr);
        return result;
    }
#else   // ! gsl_HAVE( MOVE_FORWARD )
    // Pass-through overload for compilers without move semantics: returns the
    // argument by const reference.
    template <class T>
    gsl_NODISCARD gsl_api gsl_constexpr T const &as_nullable(T const &p) gsl_noexcept {
        return p;
    }
#endif  // gsl_HAVE( MOVE_FORWARD )
    // Lvalue `not_null<T>`: returns a const reference to the wrapped pointer
    // (obtained through `not_null_accessor`) after checking it is non-null.
    template <class T>
    gsl_NODISCARD gsl_api gsl_constexpr14 T const &as_nullable(not_null<T> const &p) {
        T const &result = detail::not_null_accessor<T>::get(p);
        gsl_Expects(result != gsl_nullptr);
        return result;
    }
    // Raw-pointer `not_null<T *>` (taken by value): returns the wrapped pointer
    // without an additional check.
    template <class T>
    gsl_NODISCARD gsl_api gsl_constexpr T *as_nullable(not_null<T *> p) gsl_noexcept {
        return detail::not_null_accessor<T *>::get(p);
    }

    }  // namespace no_adl
    }  // namespace detail

    using namespace detail::no_adl;

    // not_null with implicit constructor, allowing copy-initialization:

    // `not_null_ic<T>` derives publicly from `not_null<T>` and adds a single
    // non-explicit constructor template, enabled when `T` is constructible from
    // `U`, that forwards its argument to the `not_null<T>` constructor.
    template <class T>
    class not_null_ic : public not_null<T> {
    public:
        template <class U gsl_ENABLE_IF_((std::is_constructible<T, U>::value))>
        gsl_api gsl_constexpr14
#if gsl_HAVE(MOVE_FORWARD)
        // Perfect-forwarding variant.
        not_null_ic(U &&u)
                : not_null<T>(std::forward<U>(u))
#else   // ! gsl_HAVE( MOVE_FORWARD )
        // Copy-based variant for compilers without move semantics.
        not_null_ic(U const &u)
                : not_null<T>(u)
#endif  // gsl_HAVE( MOVE_FORWARD )
        {
        }
    };

    // more not_null unwanted operators

    // Pointer arithmetic on `not_null` is disallowed: pointer difference and
    // offsetting by `std::ptrdiff_t` (in either operand order) are all declared
    // with `gsl_is_delete`.
    template <class T, class U>
    std::ptrdiff_t operator-(not_null<T> const &, not_null<U> const &) gsl_is_delete;

    template <class T>
    not_null<T> operator-(not_null<T> const &, std::ptrdiff_t) gsl_is_delete;

    template <class T>
    not_null<T> operator+(not_null<T> const &, std::ptrdiff_t) gsl_is_delete;

    template <class T>
    not_null<T> operator+(std::ptrdiff_t, not_null<T> const &) gsl_is_delete;

    // not_null comparisons

#if gsl_HAVE(NULLPTR) && gsl_HAVE(IS_DELETE)
    // Comparing a `not_null` against `nullptr` (either operand order, `==` or
    // `!=`) is a compile error: these overloads are deleted.
    template <class T>
    gsl_constexpr bool operator==(not_null<T> const &, std::nullptr_t) = delete;
    template <class T>
    gsl_constexpr bool operator==(std::nullptr_t, not_null<T> const &) = delete;
    template <class T>
    gsl_constexpr bool operator!=(not_null<T> const &, std::nullptr_t) = delete;
    template <class T>
    gsl_constexpr bool operator!=(std::nullptr_t, not_null<T> const &) = delete;
#endif  // gsl_HAVE( NULLPTR ) && gsl_HAVE( IS_DELETE )

    // Equality. A `not_null` operand is compared through the value returned by
    // its `operator->()`; overloads cover not_null/not_null, not_null/other and
    // other/not_null.
    // NOTE(review): `gsl_RETURN_DECLTYPE_` repeats the compared expression,
    // presumably to constrain the overload to operand types for which that
    // expression is valid -- confirm against the macro definition.
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator==(
            not_null<T> const &l, not_null<U> const &r)
            gsl_RETURN_DECLTYPE_(l.operator->() == r.operator->()) {
        return l.operator->() == r.operator->();
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator==(
            not_null<T> const &l, U const &r) gsl_RETURN_DECLTYPE_(l.operator->() == r) {
        return l.operator->() == r;
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator==(
            T const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(l == r.operator->()) {
        return l == r.operator->();
    }

    // Less-than. A `not_null` operand is compared through the value returned by
    // its `operator->()`; overloads cover not_null/not_null, not_null/other and
    // other/not_null. The remaining ordering operators are defined via `<`.
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator<(
            not_null<T> const &l, not_null<U> const &r)
            gsl_RETURN_DECLTYPE_(l.operator->() < r.operator->()) {
        return l.operator->() < r.operator->();
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator<(
            not_null<T> const &l, U const &r) gsl_RETURN_DECLTYPE_(l.operator->() < r) {
        return l.operator->() < r;
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator<(
            T const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(l < r.operator->()) {
        return l < r.operator->();
    }

    // Inequality: defined as the negation of `l == r` for each of the three
    // operand combinations.
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator!=(
            not_null<T> const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(!(l == r)) {
        return !(l == r);
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator!=(
            not_null<T> const &l, U const &r) gsl_RETURN_DECLTYPE_(!(l == r)) {
        return !(l == r);
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator!=(
            T const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(!(l == r)) {
        return !(l == r);
    }

    // Less-or-equal: defined as `!(r < l)` for each of the three operand
    // combinations.
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator<=(
            not_null<T> const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(!(r < l)) {
        return !(r < l);
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator<=(
            not_null<T> const &l, U const &r) gsl_RETURN_DECLTYPE_(!(r < l)) {
        return !(r < l);
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator<=(
            T const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(!(r < l)) {
        return !(r < l);
    }

    // Greater-than: defined as `r < l` for each of the three operand
    // combinations.
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator>(
            not_null<T> const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(r < l) {
        return r < l;
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator>(
            not_null<T> const &l, U const &r) gsl_RETURN_DECLTYPE_(r < l) {
        return r < l;
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator>(
            T const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(r < l) {
        return r < l;
    }

    // Greater-or-equal: defined as `!(l < r)` for each of the three operand
    // combinations.
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator>=(
            not_null<T> const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(!(l < r)) {
        return !(l < r);
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator>=(
            not_null<T> const &l, U const &r) gsl_RETURN_DECLTYPE_(!(l < r)) {
        return !(l < r);
    }
    template <class T, class U>
    gsl_NODISCARD inline gsl_api gsl_constexpr gsl_TRAILING_RETURN_TYPE_(bool) operator>=(
            T const &l, not_null<U> const &r) gsl_RETURN_DECLTYPE_(!(l < r)) {
        return !(l < r);
    }

    // print not_null

    // Stream insertion for `not_null<T>`: inserts the value returned by
    // `p.operator->()` into `os` and returns the result of that insertion.
    template <class CharType, class Traits, class T>
    std::basic_ostream<CharType, Traits> &operator<<(std::basic_ostream<CharType, Traits> &os,
                                                     not_null<T> const &p) {
        return os << p.operator->();
    }

//
// Byte-specific type.
//
#if gsl_HAVE(ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE)
    // Preferred representation: a scoped enum with underlying type
    // `unsigned char` and no enumerators.
    enum class gsl_may_alias byte : unsigned char {};
#else
    // Fallback representation: a struct holding the value in the single
    // `unsigned char` member `v`.
    struct gsl_may_alias byte {
        typedef unsigned char type;
        type v;
    };
#endif

    // Converts `v` to a `byte`. With the enum representation this is a
    // `static_cast<byte>`; with the struct representation `v` is first cast to
    // `byte::type` (`unsigned char`) and stored in the member.
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr byte to_byte(T v) gsl_noexcept {
#if gsl_HAVE(ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE)
        return static_cast<byte>(v);
#elif gsl_HAVE(CONSTEXPR_11)
        // Single return statement with brace initialization.
        return {static_cast<typename byte::type>(v)};
#else
        byte b = {static_cast<typename byte::type>(v)};
        return b;
#endif
    }

    // Converts a `byte` to the requested integral type (the template is only
    // enabled for integral `IntegerType`). The byte's `unsigned char` value is
    // extracted and then implicitly converted to `IntegerType` on return.
    template <class IntegerType gsl_ENABLE_IF_((std::is_integral<IntegerType>::value))>
    gsl_NODISCARD gsl_api inline gsl_constexpr IntegerType to_integer(byte b) gsl_noexcept {
#if gsl_HAVE(ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE)
        return static_cast<typename std::underlying_type<byte>::type>(b);
#else
        return b.v;
#endif
    }

    // Returns the value of `b` as `unsigned char` (via `to_integer`).
    gsl_NODISCARD gsl_api inline gsl_constexpr unsigned char to_uchar(byte b) gsl_noexcept {
        return to_integer<unsigned char>(b);
    }

    // Casts an `int` to `unsigned char`. The shift operators use this to
    // narrow the `int` result of a shift expression.
    gsl_NODISCARD gsl_api inline gsl_constexpr unsigned char to_uchar(int i) gsl_noexcept {
        return static_cast<unsigned char>(i);
    }

    // In-place left shift of a `byte` by an integral amount. The shifted value
    // is narrowed back to `unsigned char` before being stored. Returns a
    // reference to `b`.
    template <class IntegerType gsl_ENABLE_IF_((std::is_integral<IntegerType>::value))>
    gsl_api inline gsl_constexpr14 byte &operator<<=(byte &b, IntegerType shift) gsl_noexcept {
#if gsl_HAVE(ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE)
        return b = ::gsl::to_byte(::gsl::to_uchar(b) << shift);
#else
        b.v = ::gsl::to_uchar(b.v << shift);
        return b;
#endif
    }

    // Left shift of a `byte` by an integral amount; returns the shifted value
    // as a new `byte` (narrowed by `to_byte`).
    template <class IntegerType gsl_ENABLE_IF_((std::is_integral<IntegerType>::value))>
    gsl_NODISCARD gsl_api inline gsl_constexpr byte operator<<(byte b, IntegerType shift)
            gsl_noexcept {
        return ::gsl::to_byte(::gsl::to_uchar(b) << shift);
    }

    template <class IntegerType gsl_ENABLE_IF_((std::is_integral<IntegerType>::value))>
    gsl_NODISCARD gsl_api inline gsl_constexpr14 byte &operator>>=(byte &b, IntegerType shift)
            gsl_noexcept {
#if gsl_HAVE(ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE)
        return b = ::gsl::to_byte(::gsl::to_uchar(b) >> shift);
#else
        b.v = ::gsl::to_uchar(b.v >> shift);
        return b;
#endif
    }

    // Right shift of a `byte` by an integral amount; returns the shifted value
    // as a new `byte` (narrowed by `to_byte`).
    template <class IntegerType gsl_ENABLE_IF_((std::is_integral<IntegerType>::value))>
    gsl_NODISCARD gsl_api inline gsl_constexpr byte operator>>(byte b, IntegerType shift)
            gsl_noexcept {
        return ::gsl::to_byte(::gsl::to_uchar(b) >> shift);
    }

#if gsl_HAVE(ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE)
    // `byte` is a scoped enum: both operator families come from the generic
    // enum helper macros.
    gsl_DEFINE_ENUM_BITMASK_OPERATORS(byte)
    gsl_DEFINE_ENUM_RELATIONAL_OPERATORS(byte)
#else   // a.k.a. !gsl_HAVE( ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE )
    // `byte` is a struct wrapping `unsigned char v`: every operator is written
    // out directly in terms of `v`.

    // --- relational operators ---

    gsl_api inline gsl_constexpr bool operator==(byte l, byte r) gsl_noexcept {
        return l.v == r.v;
    }

    gsl_api inline gsl_constexpr bool operator!=(byte l, byte r) gsl_noexcept {
        return l.v != r.v;
    }

    gsl_api inline gsl_constexpr bool operator<(byte l, byte r) gsl_noexcept {
        return l.v < r.v;
    }

    gsl_api inline gsl_constexpr bool operator<=(byte l, byte r) gsl_noexcept {
        return l.v <= r.v;
    }

    gsl_api inline gsl_constexpr bool operator>(byte l, byte r) gsl_noexcept {
        return l.v > r.v;
    }

    gsl_api inline gsl_constexpr bool operator>=(byte l, byte r) gsl_noexcept {
        return l.v >= r.v;
    }

    // --- bitwise OR ---

    gsl_api inline gsl_constexpr14 byte &operator|=(byte &l, byte r) gsl_noexcept {
        l.v = static_cast<byte::type>(l.v | r.v);
        return l;
    }

    gsl_api inline gsl_constexpr byte operator|(byte l, byte r) gsl_noexcept {
        return ::gsl::to_byte(l.v | r.v);
    }

    // --- bitwise AND ---

    gsl_api inline gsl_constexpr14 byte &operator&=(byte &l, byte r) gsl_noexcept {
        l.v = static_cast<byte::type>(l.v & r.v);
        return l;
    }

    gsl_api inline gsl_constexpr byte operator&(byte l, byte r) gsl_noexcept {
        return ::gsl::to_byte(l.v & r.v);
    }

    // --- bitwise XOR ---

    gsl_api inline gsl_constexpr14 byte &operator^=(byte &l, byte r) gsl_noexcept {
        l.v = static_cast<byte::type>(l.v ^ r.v);
        return l;
    }

    gsl_api inline gsl_constexpr byte operator^(byte l, byte r) gsl_noexcept {
        return ::gsl::to_byte(l.v ^ r.v);
    }

    // --- bitwise NOT (the promoted `int` result is narrowed by `to_byte`) ---

    gsl_api inline gsl_constexpr byte operator~(byte b) gsl_noexcept {
        return ::gsl::to_byte(~b.v);
    }
#endif  // gsl_HAVE( ENUM_CLASS_CONSTRUCTION_FROM_UNDERLYING_TYPE )

#if gsl_FEATURE_TO_STD(WITH_CONTAINER)

            // Tag to select span constructor taking a container:

            // Empty tag type with a constexpr, non-throwing default constructor;
            // `with_container` below is the constant instance of it.
            struct with_container_t {
        gsl_constexpr with_container_t() gsl_noexcept {}
    };
    const gsl_constexpr with_container_t
            with_container;  // TODO: this can lead to ODR violations because the
                             // symbol will be defined in multiple translation units

#endif

    namespace detail {

    // Computes the one-past-the-end pointer of the range starting at `data` and
    // spanning `size` elements.
    template <class T>
    gsl_api gsl_constexpr14 T *endptr(T *data, gsl_CONFIG_SPAN_INDEX_TYPE size) {
        // The contract check has to come first: offsetting a null pointer by a
        // non-zero amount would be undefined behaviour.
        gsl_Expects(size == 0 || data != gsl_nullptr);
        T *const one_past_last = data + size;
        return one_past_last;
    }

    }  // namespace detail

    //
    // span<> - A 1D view of contiguous T's, replace (*,len).
    //
    template <class T>
    class span {
        template <class U>
        friend class span;

    public:
        typedef gsl_CONFIG_SPAN_INDEX_TYPE index_type;

        typedef T element_type;
        typedef typename std11::remove_cv<T>::type value_type;

        typedef T &reference;
        typedef T *pointer;
        typedef T const *const_pointer;
        typedef T const &const_reference;

        typedef pointer iterator;
        typedef const_pointer const_iterator;

        typedef std::reverse_iterator<iterator> reverse_iterator;
        typedef std::reverse_iterator<const_iterator> const_reverse_iterator;

        typedef gsl_CONFIG_SPAN_INDEX_TYPE size_type;
        typedef std::ptrdiff_t difference_type;

        // 26.7.3.2 Constructors, copy, and assignment [span.cons]

        gsl_api gsl_constexpr span() gsl_noexcept : first_(gsl_nullptr), last_(gsl_nullptr) {}

#if !gsl_DEPRECATE_TO_LEVEL(5)

#if gsl_HAVE(NULLPTR)
        gsl_api gsl_constexpr14 span(std::nullptr_t, index_type size_in)
                : first_(nullptr), last_(nullptr) {
            gsl_Expects(size_in == 0);
        }
#endif

#if gsl_HAVE(IS_DELETE)
        gsl_DEPRECATED gsl_api gsl_constexpr span(reference data_in) : span(&data_in, 1) {}

        gsl_api gsl_constexpr span(element_type &&) = delete;
#endif

#endif  // deprecate

        gsl_api gsl_constexpr14 span(pointer data_in, index_type size_in)
                : first_(data_in), last_(detail::endptr(data_in, size_in)) {}

        gsl_api gsl_constexpr14 span(pointer first_in, pointer last_in)
                : first_(first_in), last_(last_in) {
            gsl_Expects(first_in <= last_in);
        }

#if !gsl_DEPRECATE_TO_LEVEL(5)

        template <class U>
        gsl_api gsl_constexpr14 span(U *data_in, index_type size_in)
                : first_(data_in), last_(detail::endptr(data_in, size_in)) {}

#endif  // deprecate

        // Constructs a span covering all N elements of a built-in array.
#if !gsl_DEPRECATE_TO_LEVEL(5)
        // Unconstrained variant: accepts arrays of any element type U.
        template <class U, size_t N>
        gsl_api gsl_constexpr span(U (&arr)[N]) gsl_noexcept : first_(gsl_ADDRESSOF(arr[0])),
                                                               last_(gsl_ADDRESSOF(arr[0]) + N) {}
#else
        // Constrained variant: only accepts arrays of element_type.
        template <size_t N gsl_ENABLE_IF_(
                (std::is_convertible<value_type (*)[], element_type (*)[]>::value))>
        gsl_api gsl_constexpr span(element_type (&arr)[N]) gsl_noexcept
                : first_(gsl_ADDRESSOF(arr[0])),
                  last_(gsl_ADDRESSOF(arr[0]) + N) {}
#endif  // deprecate

        // Constructs a span covering all N elements of a std::array
        // (mutable and const overloads).
#if gsl_HAVE(ARRAY)
#if !gsl_DEPRECATE_TO_LEVEL(5)

        // Unconstrained variants: accept std::array of any element type U.
        template <class U, size_t N>
        gsl_api gsl_constexpr span(std::array<U, N> &arr)
                : first_(arr.data()), last_(arr.data() + N) {}

        template <class U, size_t N>
        gsl_api gsl_constexpr span(std::array<U, N> const &arr)
                : first_(arr.data()), last_(arr.data() + N) {}

#else

        // Constrained variants: only accept std::array<value_type, N>.
        template <size_t N gsl_ENABLE_IF_(
                (std::is_convertible<value_type (*)[], element_type (*)[]>::value))>
        gsl_constexpr span(std::array<value_type, N> &arr)
                : first_(arr.data()), last_(arr.data() + N) {}

        template <size_t N gsl_ENABLE_IF_(
                (std::is_convertible<value_type (*)[], element_type (*)[]>::value))>
        gsl_constexpr span(std::array<value_type, N> const &arr)
                : first_(arr.data()), last_(arr.data() + N) {}

#endif  // deprecate
#endif  // gsl_HAVE( ARRAY )

        // Constructs a span over the elements of a container.
#if gsl_HAVE(CONSTRAINED_SPAN_CONTAINER_CTOR)
        // Constrained variants: participate only for containers accepted by
        // detail::is_compatible_container; range taken from std17::data()/std17::size().
        template <class Container gsl_ENABLE_IF_(
                (detail::is_compatible_container<Container, element_type>::value))>
        gsl_api gsl_constexpr span(Container &cont) gsl_noexcept
                : first_(std17::data(cont)),
                  last_(std17::data(cont) + std17::size(cont)) {}

        // The const-container overload additionally requires a const element_type.
        template <class Container gsl_ENABLE_IF_(
                (std::is_const<element_type>::value &&
                 detail::is_compatible_container<Container, element_type>::value))>
        gsl_api gsl_constexpr span(Container const &cont) gsl_noexcept
                : first_(std17::data(cont)),
                  last_(std17::data(cont) + std17::size(cont)) {}

#elif gsl_HAVE(UNCONSTRAINED_SPAN_CONTAINER_CTOR)

        // Unconstrained variants: use cont.size() and the address of cont[0];
        // an empty container yields a span with null begin/end pointers.
        template <class Container>
        gsl_constexpr span(Container &cont)
                : first_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0])),
                  last_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0]) + cont.size()) {}

        template <class Container>
        gsl_constexpr span(Container const &cont)
                : first_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0])),
                  last_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0]) + cont.size()) {}

#endif

#if gsl_FEATURE_TO_STD(WITH_CONTAINER)

        // Tag-dispatched container constructors: the with_container_t argument
        // selects these overloads explicitly. An empty container yields a span
        // with null begin/end pointers; otherwise the range starts at &cont[0]
        // and spans cont.size() elements.
        template <class Container>
        gsl_constexpr span(with_container_t, Container &cont) gsl_noexcept
                : first_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0])),
                  last_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0]) + cont.size()) {}

        template <class Container>
        gsl_constexpr span(with_container_t, Container const &cont) gsl_noexcept
                : first_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0])),
                  last_(cont.size() == 0 ? gsl_nullptr : gsl_ADDRESSOF(cont[0]) + cont.size()) {}

#endif

#if !gsl_DEPRECATE_TO_LEVEL(4)
        // constructor taking shared_ptr deprecated since 0.29.0

#if gsl_HAVE(SHARED_PTR)
        // Views the single object owned by `ptr`; a null shared_ptr gives an empty span.
        gsl_DEPRECATED gsl_constexpr span(shared_ptr<element_type> const &ptr)
                : first_(ptr.get()), last_(ptr.get() ? ptr.get() + 1 : gsl_nullptr) {}
#endif

        // constructors taking unique_ptr deprecated since 0.29.0

#if gsl_HAVE(UNIQUE_PTR)
#if gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG)
        template <class ArrayElementType = typename std::add_pointer<element_type>::type>
#else
        template <class ArrayElementType>
#endif
        // Views `count` elements starting at ptr.get(). No null check is performed
        // here; the caller supplies a count that matches the owned storage.
        gsl_DEPRECATED gsl_constexpr span(unique_ptr<ArrayElementType> const &ptr, index_type count)
                : first_(ptr.get()), last_(ptr.get() + count) {
        }

        // Views the single object owned by `ptr`; a null unique_ptr gives an empty span.
        gsl_DEPRECATED gsl_constexpr span(unique_ptr<element_type> const &ptr)
                : first_(ptr.get()), last_(ptr.get() ? ptr.get() + 1 : gsl_nullptr) {}
#endif

#endif  // deprecate shared_ptr, unique_ptr

        // Copy / move construction. Defaulted where the compiler supports it
        // (GCC versions in the 430..600 range are excluded); otherwise a
        // hand-written copy constructor copies the begin/end pointers.
#if gsl_HAVE(IS_DEFAULT) && !gsl_BETWEEN(gsl_COMPILER_GNUC_VERSION, 430, 600)
        gsl_constexpr span(span &&) gsl_noexcept = default;
        gsl_constexpr span(span const &) = default;
#else
        gsl_api gsl_constexpr span(span const &other) : first_(other.begin()), last_(other.end()) {}
#endif

        // Copy / move assignment. Defaulted where supported; the fallback takes
        // its argument by value and copies both pointers.
#if gsl_HAVE(IS_DEFAULT)
        gsl_constexpr14 span &operator=(span &&) gsl_noexcept = default;
        gsl_constexpr14 span &operator=(span const &) gsl_noexcept = default;
#else
        gsl_constexpr14 span &operator=(span other) gsl_noexcept {
            first_ = other.first_;
            last_ = other.last_;
            return *this;
        }
#endif

        // Converting constructor from span<U>; enabled only when an array of U is
        // convertible to an array of element_type (e.g. adding const).
        template <class U gsl_ENABLE_IF_((std::is_convertible<U (*)[], element_type (*)[]>::value))>
        gsl_api gsl_constexpr span(span<U> const &other)
                : first_(other.begin()), last_(other.end()) {}

#if 0
    // Converting from other span ?
    template< class U > operator=();
#endif

        // 26.7.3.3 Subviews [span.sub]

        // Returns a view of the leading `count` elements.
        // Precondition: count <= size(). Both sides are compared as std::size_t,
        // so a negative count of a signed index_type is rejected too.
        gsl_NODISCARD gsl_api gsl_constexpr14 span first(index_type count) const {
            gsl_Expects(std::size_t(count) <= std::size_t(this->size()));
            return span(first_, count);
        }

        // Returns a view of the trailing `count` elements.
        // Precondition: count <= size() (compared as std::size_t).
        gsl_NODISCARD gsl_api gsl_constexpr14 span last(index_type count) const {
            gsl_Expects(std::size_t(count) <= std::size_t(this->size()));
            return span(first_ + size() - count, count);
        }

        // Returns a view of everything from element `offset` to the end.
        // Precondition: offset <= size() (compared as std::size_t).
        gsl_NODISCARD gsl_api gsl_constexpr14 span subspan(index_type offset) const {
            gsl_Expects(std::size_t(offset) <= std::size_t(this->size()));
            return span(first_ + offset, size() - offset);
        }

        // Returns a view of `count` elements starting at element `offset`.
        // Precondition: offset <= size() and count <= size() - offset
        // (both compared as std::size_t).
        gsl_NODISCARD gsl_api gsl_constexpr14 span subspan(index_type offset,
                                                           index_type count) const {
            gsl_Expects(std::size_t(offset) <= std::size_t(this->size()) &&
                        std::size_t(count) <= std::size_t(this->size() - offset));
            return span(first_ + offset, count);
        }

        // 26.7.3.4 Observers [span.obs]

        // Number of elements in the span: the pointer difference last_ - first_
        // converted to index_type.
        gsl_NODISCARD gsl_api gsl_constexpr index_type size() const gsl_noexcept {
            return narrow_cast<index_type>(last_ - first_);
        }

        // Number of elements in the span as a signed std::ptrdiff_t.
        gsl_NODISCARD gsl_api gsl_constexpr std::ptrdiff_t ssize() const gsl_noexcept {
            return narrow_cast<std::ptrdiff_t>(last_ - first_);
        }

        // Size of the viewed range in bytes: element count times sizeof(element_type).
        gsl_NODISCARD gsl_api gsl_constexpr index_type size_bytes() const gsl_noexcept {
            return narrow_cast<index_type>(sizeof(element_type)) * size();
        }

        // True when the span contains no elements.
        gsl_NODISCARD gsl_api gsl_constexpr bool empty() const gsl_noexcept { return size() == 0; }

        // 26.7.3.5 Element access [span.elem]

        // Returns a reference to the element at index `pos`.
        // Precondition: pos < size(). Both sides are compared as std::size_t, as in
        // first()/last()/subspan(), so that a negative index is rejected as well
        // when index_type is configured to be a signed type.
        gsl_NODISCARD gsl_api gsl_constexpr14 reference operator[](index_type pos) const {
            gsl_Expects(std::size_t(pos) < std::size_t(size()));
            return first_[pos];
        }

#if !gsl_DEPRECATE_TO_LEVEL(6)
        // Deprecated call-operator element access; forwards to operator[].
        gsl_DEPRECATED_MSG("use subscript indexing instead") gsl_api gsl_constexpr14 reference
        operator()(index_type pos) const {
            return (*this)[pos];
        }

        // Deprecated at(); forwards to operator[], so an out-of-range index is
        // handled by operator[]'s precondition check.
        gsl_DEPRECATED_MSG("use subscript indexing instead") gsl_api gsl_constexpr14 reference
                at(index_type pos) const {
            return (*this)[pos];
        }
#endif  // deprecate

        // Returns a reference to the first element.
        // Precondition: the span is not empty.
        gsl_NODISCARD gsl_api gsl_constexpr14 reference front() const {
            gsl_Expects(first_ != last_);
            return first_[0];
        }

        // Returns a reference to the last element.
        // Precondition: the span is not empty.
        gsl_NODISCARD gsl_api gsl_constexpr14 reference back() const {
            gsl_Expects(first_ != last_);
            return last_[-1];
        }

        // Pointer to the first element (null for a default-constructed span).
        gsl_NODISCARD gsl_api gsl_constexpr pointer data() const gsl_noexcept { return first_; }

        // 26.7.3.6 Iterator support [span.iterators]

        // Iterator to the first element.
        gsl_NODISCARD gsl_api gsl_constexpr iterator begin() const gsl_noexcept {
            return iterator(first_);
        }

        // Iterator one past the last element.
        gsl_NODISCARD gsl_api gsl_constexpr iterator end() const gsl_noexcept {
            return iterator(last_);
        }

        // Const iterator to the first element, converted from begin().
        gsl_NODISCARD gsl_api gsl_constexpr const_iterator cbegin() const gsl_noexcept {
#if gsl_CPP11_OR_GREATER
            return {begin()};
#else
            return const_iterator(begin());
#endif
        }

        // Const iterator one past the last element, converted from end().
        gsl_NODISCARD gsl_api gsl_constexpr const_iterator cend() const gsl_noexcept {
#if gsl_CPP11_OR_GREATER
            return {end()};
#else
            return const_iterator(end());
#endif
        }

        // Reverse iterator starting at the last element (wraps end()).
        gsl_NODISCARD gsl_constexpr17 reverse_iterator rbegin() const gsl_noexcept {
            return reverse_iterator(end());
        }

        // Reverse iterator marking the end of reverse traversal (wraps begin()).
        gsl_NODISCARD gsl_constexpr17 reverse_iterator rend() const gsl_noexcept {
            return reverse_iterator(begin());
        }

        // Const reverse iterator starting at the last element (wraps cend()).
        gsl_NODISCARD gsl_constexpr17 const_reverse_iterator crbegin() const gsl_noexcept {
            return const_reverse_iterator(cend());
        }

        // Const reverse iterator marking the end of reverse traversal (wraps cbegin()).
        gsl_NODISCARD gsl_constexpr17 const_reverse_iterator crend() const gsl_noexcept {
            return const_reverse_iterator(cbegin());
        }

        // Exchanges the viewed range with `other` by swapping both boundary
        // pointers; the underlying elements are not touched.
        gsl_constexpr14 void swap(span &other) gsl_noexcept {
            std::swap(last_, other.last_);
            std::swap(first_, other.first_);
        }

#if !gsl_DEPRECATE_TO_LEVEL(3)
        // member length() deprecated since 0.29.0

        // Deprecated alias of size().
        gsl_DEPRECATED_MSG("use size() instead") gsl_api gsl_constexpr index_type
                length() const gsl_noexcept {
            return size();
        }

        // member length_bytes() deprecated since 0.29.0

        // Deprecated alias of size_bytes().
        gsl_DEPRECATED_MSG("use size_bytes() instead") gsl_api gsl_constexpr index_type
                length_bytes() const gsl_noexcept {
            return size_bytes();
        }
#endif

#if !gsl_DEPRECATE_TO_LEVEL(2)
        // member as_bytes(), as_writeable_bytes deprecated since 0.17.0

        // Deprecated: read-only byte view of the same memory, size_bytes() long.
        gsl_DEPRECATED_MSG("use free function gsl::as_bytes() instead")
                gsl_api span<const byte> as_bytes() const gsl_noexcept {
            return span<const byte>(reinterpret_cast<const byte *>(data()),
                                    size_bytes());  // NOLINT
        }

        // Deprecated: writable byte view of the same memory, size_bytes() long.
        gsl_DEPRECATED_MSG("use free function gsl::as_writable_bytes() instead")
                gsl_api span<byte> as_writeable_bytes() const gsl_noexcept {
            return span<byte>(reinterpret_cast<byte *>(data()),
                              size_bytes());  // NOLINT
        }

#endif

        // Reinterprets the viewed memory as a span of U.
        // Precondition: the byte size of this span is a multiple of sizeof(U).
        // The element count of the result is size_bytes() / sizeof(U).
        template <class U>
        gsl_NODISCARD gsl_api span<U> as_span() const {
            gsl_Expects((this->size_bytes() % sizeof(U)) == 0);
            U *const reinterpreted = reinterpret_cast<U *>(first_);  // NOLINT
            return span<U>(reinterpreted, this->size_bytes() / sizeof(U));
        }

    private:
        pointer first_;
        pointer last_;
    };

    // class template argument deduction guides:

#if gsl_HAVE(DEDUCTION_GUIDES)  // gsl_CPP17_OR_GREATER

    // Built-in array: deduce span<T>.
    template <class T, size_t N>
    span(T(&)[N]) -> span<T /*, N*/>;

    // Mutable std::array: deduce span<T>.
    template <class T, size_t N>
    span(std::array<T, N> &) -> span<T /*, N*/>;

    // Const std::array: deduce span<const T>.
    template <class T, size_t N>
    span(std::array<T, N> const &) -> span<const T /*, N*/>;

    // Mutable container: deduce span of the container's value_type.
    template <class Container>
    span(Container &) -> span<typename Container::value_type>;

    // Const container: deduce span of const value_type.
    template <class Container>
    span(Container const &) -> span<const typename Container::value_type>;

#endif  // gsl_HAVE( DEDUCTION_GUIDES )

    // 26.7.3.7 Comparison operators [span.comparison]

#if gsl_CONFIG(ALLOWS_SPAN_COMPARISON)
    // Primary comparison operators for span. In non-strict mode the two spans may
    // have different element types; in strict mode both must be span<T>.
#if gsl_CONFIG(ALLOWS_NONSTRICT_SPAN_COMPARISON)

    // Equal when the sizes match and either both spans start at the same
    // address or all elements compare equal.
    template <class T, class U>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr bool operator==(
            span<T> const &l, span<U> const &r) {
        return l.size() == r.size() &&
               (l.begin() == r.begin() || std98::equal(l.begin(), l.end(), r.begin()));
    }

    // Lexicographical less-than over the elements.
    template <class T, class U>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr bool operator<(
            span<T> const &l, span<U> const &r) {
        return std98::lexicographical_compare(l.begin(), l.end(), r.begin(), r.end());
    }

#else   // a.k.a. !gsl_CONFIG( ALLOWS_NONSTRICT_SPAN_COMPARISON )

    // Equal when the sizes match and either both spans start at the same
    // address or all elements compare equal.
    template <class T>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr bool operator==(
            span<T> const &l, span<T> const &r) {
        return l.size() == r.size() &&
               (l.begin() == r.begin() || std98::equal(l.begin(), l.end(), r.begin()));
    }

    // Lexicographical less-than over the elements.
    template <class T>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr bool operator<(
            span<T> const &l, span<T> const &r) {
        return std98::lexicographical_compare(l.begin(), l.end(), r.begin(), r.end());
    }
#endif  // gsl_CONFIG( ALLOWS_NONSTRICT_SPAN_COMPARISON )

    // Inequality, defined as the negation of operator==.
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr bool operator!=(span<T> const &l, span<U> const &r) {
        return !(l == r);
    }

    // Less-or-equal, defined as !(r < l).
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr bool operator<=(span<T> const &l, span<U> const &r) {
        return !(r < l);
    }

    // Greater-than, defined as (r < l).
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr bool operator>(span<T> const &l, span<U> const &r) {
        return (r < l);
    }

    // Greater-or-equal, defined as !(l < r).
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr bool operator>=(span<T> const &l, span<U> const &r) {
        return !(l < r);
    }
#endif  // gsl_CONFIG( ALLOWS_SPAN_COMPARISON )

    // span algorithms

    // Free-function form of span::size(), returned as std::size_t.
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr std::size_t size(span<T> const &spn) {
        return static_cast<std::size_t>(spn.size());
    }

    // Free-function form of span::ssize() (signed element count).
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr std::ptrdiff_t ssize(span<T> const &spn) {
        return spn.ssize();
    }

    namespace detail {

    // Copies `count` elements from `first` to `result` and returns the output
    // iterator advanced past the last element written. Nothing is copied when
    // `count` is not positive. The source iterator is advanced only between
    // reads, i.e. count - 1 times, never past the last element read.
    template <class II, class N, class OI>
    gsl_api gsl_constexpr14 inline OI copy_n(II first, N count, OI result) {
        if (!(count > 0)) {
            return result;
        }

        *result++ = *first;
        N i = 1;
        while (i < count) {
            *result++ = *++first;
            ++i;
        }
        return result;
    }
    }  // namespace detail

    // Copies all elements of `src` into the beginning of `dest`.
    // Precondition: dest must be at least as large as src.
    // With C++14 or later, assignability of the element types is checked at
    // compile time.
    template <class T, class U>
    gsl_api gsl_constexpr14 inline void copy(span<T> src, span<U> dest) {
        // The language-level check below is used instead of gsl_HAVE( TYPE_TRAITS )
        // (circumvent Travis clang 3.4).
#if gsl_CPP14_OR_GREATER
        static_assert(std::is_assignable<U &, T const &>::value,
                      "Cannot assign elements of source span to elements of "
                      "destination span");
#endif
        gsl_Expects(dest.size() >= src.size());
        detail::copy_n(src.data(), src.size(), dest.data());
    }

    // span creator functions (see ctors)

    // Returns a read-only byte view over the memory referenced by `spn`;
    // the result is spn.size_bytes() bytes long.
    template <class T>
    gsl_NODISCARD gsl_api inline span<const byte> as_bytes(span<T> spn) gsl_noexcept {
        const byte *const raw = reinterpret_cast<const byte *>(spn.data());  // NOLINT
        return span<const byte>(raw, spn.size_bytes());
    }

    // Returns a writable byte view over the memory referenced by `spn`;
    // the result is spn.size_bytes() bytes long.
    template <class T>
    gsl_NODISCARD gsl_api inline span<byte> as_writable_bytes(span<T> spn) gsl_noexcept {
        byte *const raw = reinterpret_cast<byte *>(spn.data());  // NOLINT
        return span<byte>(raw, spn.size_bytes());
    }

#if !gsl_DEPRECATE_TO_LEVEL(6)
    // Deprecated spelling of as_writable_bytes(); returns the same writable
    // byte view of spn.size_bytes() bytes.
    template <class T>
    gsl_DEPRECATED_MSG("use as_writable_bytes() (different spelling) instead")
            gsl_api inline span<byte>
            as_writeable_bytes(span<T> spn) gsl_noexcept {
        return span<byte>(reinterpret_cast<byte *>(spn.data()),
                          spn.size_bytes());  // NOLINT
    }
#endif  // deprecate

#if gsl_FEATURE_TO_STD(MAKE_SPAN)

    // Creates a span<T> over `count` elements starting at `ptr`.
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr span<T> make_span(
            T * ptr, typename span<T>::index_type count) {
        return span<T>(ptr, count);
    }

    // Creates a span<T> over the pointer range [first, last).
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr span<T> make_span(T * first, T * last) {
        return span<T>(first, last);
    }

    // Creates a span<T> covering all N elements of a built-in array.
    template <class T, size_t N>
    gsl_NODISCARD inline gsl_constexpr span<T> make_span(T(&arr)[N]) {
        return span<T>(gsl_ADDRESSOF(arr[0]), N);
    }

#if gsl_HAVE(ARRAY)

    // Creates a span<T> over a mutable std::array.
    template <class T, size_t N>
    gsl_NODISCARD inline gsl_constexpr span<T> make_span(std::array<T, N> & arr) {
        return span<T>(arr);
    }

    // Creates a span<const T> over a const std::array.
    template <class T, size_t N>
    gsl_NODISCARD inline gsl_constexpr span<const T> make_span(std::array<T, N> const &arr) {
        return span<const T>(arr);
    }
#endif

    // Creates a span over the elements of a container.
#if gsl_HAVE(CONSTRAINED_SPAN_CONTAINER_CTOR) && gsl_HAVE(AUTO)

    // Generic variants: the element type is derived from the pointer type
    // returned by std17::data() for the container.
    template <class Container, class EP = decltype(std17::data(std::declval<Container &>()))>
    gsl_NODISCARD inline gsl_constexpr auto make_span(Container & cont)
            ->span<typename std::remove_pointer<EP>::type> {
        return span<typename std::remove_pointer<EP>::type>(cont);
    }

    template <class Container, class EP = decltype(std17::data(std::declval<Container &>()))>
    gsl_NODISCARD inline gsl_constexpr auto make_span(Container const &cont)
            ->span<const typename std::remove_pointer<EP>::type> {
        return span<const typename std::remove_pointer<EP>::type>(cont);
    }

#else

    // Fallback variants: only std::vector is supported, via the tagged
    // with_container constructor of span.
    template <class T>
    inline span<T> make_span(std::vector<T> & cont) {
        return span<T>(with_container, cont);
    }

    template <class T>
    inline span<const T> make_span(std::vector<T> const &cont) {
        return span<const T>(with_container, cont);
    }
#endif

#if gsl_FEATURE_TO_STD(WITH_CONTAINER)

    // Tagged variants: explicitly select span's with_container constructor.
    // The element type is the container's value_type (const-qualified for a
    // const container).
    template <class Container>
    gsl_NODISCARD inline gsl_constexpr span<typename Container::value_type> make_span(
            with_container_t, Container & cont) gsl_noexcept {
        return span<typename Container::value_type>(with_container, cont);
    }

    template <class Container>
    gsl_NODISCARD inline gsl_constexpr span<const typename Container::value_type> make_span(
            with_container_t, Container const &cont) gsl_noexcept {
        return span<const typename Container::value_type>(with_container, cont);
    }

#endif  // gsl_FEATURE_TO_STD( WITH_CONTAINER )

#if !gsl_DEPRECATE_TO_LEVEL(4)
    // Deprecated: creates a span from a smart-pointer-like object exposing
    // `element_type`, using span's (deprecated) smart pointer constructor.
    template <class Ptr>
    gsl_DEPRECATED inline span<typename Ptr::element_type> make_span(Ptr & ptr) {
        return span<typename Ptr::element_type>(ptr);
    }
#endif  // !gsl_DEPRECATE_TO_LEVEL( 4 )

    // Deprecated: creates a span of `count` elements from a smart-pointer-like
    // object exposing `element_type`.
    // NOTE(review): unlike the overload above, this one is not inside the
    // !gsl_DEPRECATE_TO_LEVEL( 4 ) guard, while span's unique_ptr + count
    // constructor is guarded that way; confirm whether this is intentional.
    template <class Ptr>
    gsl_DEPRECATED inline span<typename Ptr::element_type> make_span(
            Ptr & ptr, typename span<typename Ptr::element_type>::index_type count) {
        return span<typename Ptr::element_type>(ptr, count);
    }

#endif  // gsl_FEATURE_TO_STD( MAKE_SPAN )

#if gsl_FEATURE_TO_STD(BYTE_SPAN)

    // Returns a writable byte view over the object representation of `t`
    // (sizeof(T) bytes starting at its address).
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr span<byte> byte_span(T & t) gsl_noexcept {
        return span<byte>(reinterpret_cast<byte *>(&t), sizeof(T));
    }

    // Returns a read-only byte view over the object representation of `t`.
    template <class T>
    gsl_NODISCARD gsl_api inline gsl_constexpr span<const byte> byte_span(T const &t) gsl_noexcept {
        return span<const byte>(reinterpret_cast<byte const *>(&t), sizeof(T));
    }

#endif  // gsl_FEATURE_TO_STD( BYTE_SPAN )

    //
    // basic_string_span:
    //

    template <class T>
    class basic_string_span;

    namespace detail {

    // Type trait helper: false for every type except basic_string_span<T>.
    template <class T>
    struct is_basic_string_span_oracle : std11::false_type {};

    template <class T>
    struct is_basic_string_span_oracle<basic_string_span<T>> : std11::true_type {};

    // Type trait: true when T, ignoring cv-qualifiers, is a basic_string_span.
    template <class T>
    struct is_basic_string_span : is_basic_string_span_oracle<typename std11::remove_cv<T>::type> {
    };

    // Returns the number of elements before the first zero element of `ptr`,
    // examining at most `max` elements. A null `ptr` or a `max` of 0 yields 0.
    template <class T>
    gsl_api inline gsl_constexpr14 std::size_t string_length(T *ptr, std::size_t max) {
        // `max` is unsigned, so the only non-positive value it can hold is 0.
        if (ptr == gsl_nullptr || max == 0)
            return 0;

        std::size_t len = 0;
        while (len < max && ptr[len])  // NOLINT
            ++len;

        return len;
    }

    }  // namespace detail

    //
    // basic_string_span<> - A view of contiguous characters, replace (*,len).
    //
    // Thin wrapper around span<T> for character sequences. Constructors taking a
    // bare pointer, a built-in array or a std::array trim the view at the first
    // zero element (see remove_z); all other operations forward to the span.
    template <class T>
    class basic_string_span {
    public:
        typedef T element_type;
        typedef span<T> span_type;

        typedef typename span_type::size_type size_type;
        typedef typename span_type::index_type index_type;
        typedef typename span_type::difference_type difference_type;

        typedef typename span_type::pointer pointer;
        typedef typename span_type::reference reference;

        typedef typename span_type::iterator iterator;
        typedef typename span_type::const_iterator const_iterator;
        typedef typename span_type::reverse_iterator reverse_iterator;
        typedef typename span_type::const_reverse_iterator const_reverse_iterator;

        // construction:

        // Default construction: wraps a default-constructed span.
#if gsl_HAVE(IS_DEFAULT)
        gsl_constexpr basic_string_span() gsl_noexcept = default;
#else
        gsl_api gsl_constexpr basic_string_span() gsl_noexcept {}
#endif

#if gsl_HAVE(NULLPTR)
        // Construction from a null pointer literal: wraps an empty span.
        gsl_api gsl_constexpr basic_string_span(std::nullptr_t) gsl_noexcept
                : span_(nullptr, static_cast<index_type>(0)) {}
#endif

        // Construction from a zero-terminated sequence: the length is found by
        // scanning for the first zero element, bounded by the maximum index_type value.
#ifdef __CUDACC_RELAXED_CONSTEXPR__
        gsl_api
#endif  // __CUDACC_RELAXED_CONSTEXPR__
                gsl_constexpr
                basic_string_span(pointer ptr)
                : span_(remove_z(ptr, (std::numeric_limits<index_type>::max)())) {
        }

        // Construction from pointer + count: no zero-termination handling.
        gsl_api gsl_constexpr basic_string_span(pointer ptr, index_type count)
                : span_(ptr, count) {}

        // Construction from a pointer range [firstElem, lastElem).
        gsl_api gsl_constexpr basic_string_span(pointer firstElem, pointer lastElem)
                : span_(firstElem, lastElem) {}

        // Construction from a built-in array: trimmed at the first zero element,
        // or covering all N elements when none is found.
        template <std::size_t N>
        gsl_constexpr basic_string_span(element_type (&arr)[N])
                : span_(remove_z(gsl_ADDRESSOF(arr[0]), N)) {}

#if gsl_HAVE(ARRAY)

        // Construction from std::array: trimmed at the first zero element.
        template <std::size_t N>
        gsl_constexpr basic_string_span(
                std::array<typename std11::remove_const<element_type>::type, N> &arr)
                : span_(remove_z(arr)) {}

        template <std::size_t N>
        gsl_constexpr basic_string_span(
                std::array<typename std11::remove_const<element_type>::type, N> const &arr)
                : span_(remove_z(arr)) {}

#endif

        // Construction from a container; forwards the container to span's
        // container constructor without zero-termination handling.
#if gsl_HAVE(CONSTRAINED_SPAN_CONTAINER_CTOR)

        // Exclude: array, [basic_string,] basic_string_span

        template <class Container gsl_ENABLE_IF_(
                (!detail::is_std_array<Container>::value &&
                 !detail::is_basic_string_span<Container>::value &&
                 std::is_convertible<typename Container::pointer, pointer>::value &&
                 std::is_convertible<typename Container::pointer,
                                     decltype(std::declval<Container>().data())>::value))>
        gsl_constexpr basic_string_span(Container &cont) : span_((cont)) {}

        // Exclude: array, [basic_string,] basic_string_span

        template <class Container gsl_ENABLE_IF_(
                (!detail::is_std_array<Container>::value &&
                 !detail::is_basic_string_span<Container>::value &&
                 std::is_convertible<typename Container::pointer, pointer>::value &&
                 std::is_convertible<typename Container::pointer,
                                     decltype(std::declval<Container const &>().data())>::value))>
        gsl_constexpr basic_string_span(Container const &cont) : span_((cont)) {}

#elif gsl_HAVE(UNCONSTRAINED_SPAN_CONTAINER_CTOR)

        template <class Container>
        gsl_constexpr basic_string_span(Container &cont) : span_(cont) {}

        template <class Container>
        gsl_constexpr basic_string_span(Container const &cont) : span_(cont) {}

#else

        // Without container constructors, only construction from a span is offered.
        template <class U>
        gsl_api gsl_constexpr basic_string_span(span<U> const &rhs) : span_(rhs) {}

#endif

#if gsl_FEATURE_TO_STD(WITH_CONTAINER)

        // Tagged container construction; forwards to span's with_container constructor.
        template <class Container>
        gsl_constexpr basic_string_span(with_container_t, Container &cont)
                : span_(with_container, cont) {}
#endif

        // Copy / move construction (defaulted; noexcept is omitted for GCC
        // versions in the 440..600 range).
#if gsl_HAVE(IS_DEFAULT)
#if gsl_BETWEEN(gsl_COMPILER_GNUC_VERSION, 440, 600)
        gsl_constexpr basic_string_span(basic_string_span const &) = default;

        gsl_constexpr basic_string_span(basic_string_span &&) = default;
#else
        gsl_constexpr basic_string_span(basic_string_span const &) gsl_noexcept = default;

        gsl_constexpr basic_string_span(basic_string_span &&) gsl_noexcept = default;
#endif
#endif

        // Converting construction from basic_string_span<U> whose pointer type
        // is convertible to this one's; views the same elements.
        template <class U gsl_ENABLE_IF_(
                (std::is_convertible<typename basic_string_span<U>::pointer, pointer>::value))>
        gsl_api gsl_constexpr basic_string_span(basic_string_span<U> const &rhs)
                : span_(reinterpret_cast<pointer>(rhs.data()), rhs.length())  // NOLINT
        {}

#if gsl_STDLIB_CPP11_120
        template <class U gsl_ENABLE_IF_(
                (std::is_convertible<typename basic_string_span<U>::pointer, pointer>::value))>
        gsl_api gsl_constexpr basic_string_span(basic_string_span<U> &&rhs)
                : span_(reinterpret_cast<pointer>(rhs.data()), rhs.length())  // NOLINT
        {}
#endif  // gsl_STDLIB_CPP11_120

        // Construction from std::basic_string: views str.length() characters
        // starting at &str[0].
        template <class CharTraits, class Allocator>
        gsl_constexpr basic_string_span(
                std::basic_string<typename std11::remove_const<element_type>::type,
                                  CharTraits,
                                  Allocator> &str)
                : span_(gsl_ADDRESSOF(str[0]), str.length()) {}

        template <class CharTraits, class Allocator>
        gsl_constexpr basic_string_span(
                std::basic_string<typename std11::remove_const<element_type>::type,
                                  CharTraits,
                                  Allocator> const &str)
                : span_(gsl_ADDRESSOF(str[0]), str.length()) {}

        // assignment:

#if gsl_HAVE(IS_DEFAULT)
        gsl_constexpr14 basic_string_span &operator=(basic_string_span const &)
                gsl_noexcept = default;

        gsl_constexpr14 basic_string_span &operator=(basic_string_span &&) gsl_noexcept = default;
#endif

        // sub span:
        // Each function forwards to the corresponding span member; the result
        // is converted back to a basic_string_span.

        /*gsl_api*/  // currently disabled due to an apparent NVCC bug
        gsl_NODISCARD gsl_constexpr14 basic_string_span first(index_type count) const {
            return span_.first(count);
        }

        /*gsl_api*/  // currently disabled due to an apparent NVCC bug
        gsl_NODISCARD gsl_constexpr14 basic_string_span last(index_type count) const {
            return span_.last(count);
        }

        /*gsl_api*/  // currently disabled due to an apparent NVCC bug
        gsl_NODISCARD gsl_constexpr14 basic_string_span subspan(index_type offset) const {
            return span_.subspan(offset);
        }

        /*gsl_api*/  // currently disabled due to an apparent NVCC bug
        gsl_NODISCARD gsl_constexpr14 basic_string_span subspan(index_type offset,
                                                                index_type count) const {
            return span_.subspan(offset, count);
        }

        // observers:

        // length() and size() both return the element count of the wrapped span.
        gsl_NODISCARD gsl_api gsl_constexpr index_type length() const gsl_noexcept {
            return span_.size();
        }

        gsl_NODISCARD gsl_api gsl_constexpr index_type size() const gsl_noexcept {
            return span_.size();
        }

        // length_bytes() and size_bytes() both return the byte size of the wrapped span.
        gsl_NODISCARD gsl_api gsl_constexpr index_type length_bytes() const gsl_noexcept {
            return span_.size_bytes();
        }

        gsl_NODISCARD gsl_api gsl_constexpr index_type size_bytes() const gsl_noexcept {
            return span_.size_bytes();
        }

        gsl_NODISCARD gsl_api gsl_constexpr bool empty() const gsl_noexcept { return size() == 0; }

        // Element access; forwards to span::operator[].
        gsl_NODISCARD gsl_api gsl_constexpr14 reference operator[](index_type idx) const {
            return span_[idx];
        }

#if !gsl_DEPRECATE_TO_LEVEL(6)
        gsl_DEPRECATED_MSG("use subscript indexing instead") gsl_api gsl_constexpr14 reference
        operator()(index_type idx) const {
            return span_[idx];
        }
#endif  // deprecate

        gsl_NODISCARD gsl_api gsl_constexpr14 reference front() const { return span_.front(); }

        gsl_NODISCARD gsl_api gsl_constexpr14 reference back() const { return span_.back(); }

        gsl_NODISCARD gsl_api gsl_constexpr pointer data() const gsl_noexcept {
            return span_.data();
        }

        // Iterator access; all functions forward to the wrapped span.
        gsl_NODISCARD gsl_api gsl_constexpr iterator begin() const gsl_noexcept {
            return span_.begin();
        }

        gsl_NODISCARD gsl_api gsl_constexpr iterator end() const gsl_noexcept {
            return span_.end();
        }

        gsl_NODISCARD gsl_constexpr17 reverse_iterator rbegin() const gsl_noexcept {
            return span_.rbegin();
        }

        gsl_NODISCARD gsl_constexpr17 reverse_iterator rend() const gsl_noexcept {
            return span_.rend();
        }

        // const version not in p0123r2:

        gsl_NODISCARD gsl_api gsl_constexpr const_iterator cbegin() const gsl_noexcept {
            return span_.cbegin();
        }

        gsl_NODISCARD gsl_api gsl_constexpr const_iterator cend() const gsl_noexcept {
            return span_.cend();
        }

        gsl_NODISCARD gsl_constexpr17 const_reverse_iterator crbegin() const gsl_noexcept {
            return span_.crbegin();
        }

        gsl_NODISCARD gsl_constexpr17 const_reverse_iterator crend() const gsl_noexcept {
            return span_.crend();
        }

    private:
        // Builds a span starting at `sz` whose length is the number of elements
        // before the first zero element, examining at most `max` elements.
        gsl_api static gsl_constexpr14 span_type remove_z(pointer sz, std::size_t max) {
            return span_type(sz, detail::string_length(sz, max));
        }

#if gsl_HAVE(ARRAY)
        // std::array overloads: scan at most N elements starting at &arr[0].
        template <size_t N>
        gsl_NODISCARD static gsl_constexpr14 span_type
        remove_z(std::array<typename std11::remove_const<element_type>::type, N> &arr) {
            return remove_z(gsl_ADDRESSOF(arr[0]), narrow_cast<std::size_t>(N));
        }

        template <size_t N>
        gsl_NODISCARD static gsl_constexpr14 span_type
        remove_z(std::array<typename std11::remove_const<element_type>::type, N> const &arr) {
            return remove_z(gsl_ADDRESSOF(arr[0]), narrow_cast<std::size_t>(N));
        }
#endif

    private:
        // The wrapped view; every observer above forwards to it.
        span_type span_;
    };

    // basic_string_span comparison functions:

#if gsl_CONFIG(ALLOWS_NONSTRICT_SPAN_COMPARISON)

    template <class T, class U>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr14 bool operator==(
            basic_string_span<T> const &l, U const &u) gsl_noexcept {
        const basic_string_span<typename std11::add_const<T>::type> r(u);

        return l.size() == r.size() && std98::equal(l.begin(), l.end(), r.begin());
    }

    template <class T, class U>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr14 bool operator<(
            basic_string_span<T> const &l, U const &u) gsl_noexcept {
        const basic_string_span<typename std11::add_const<T>::type> r(u);

        return std98::lexicographical_compare(l.begin(), l.end(), r.begin(), r.end());
    }

#if gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG)

    template <class T, class U gsl_ENABLE_IF_((!detail::is_basic_string_span<U>::value))>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr14 bool operator==(
            U const &u, basic_string_span<T> const &r) gsl_noexcept {
        const basic_string_span<typename std11::add_const<T>::type> l(u);

        return l.size() == r.size() && std98::equal(l.begin(), l.end(), r.begin());
    }

    template <class T, class U gsl_ENABLE_IF_((!detail::is_basic_string_span<U>::value))>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr14 bool operator<(
            U const &u, basic_string_span<T> const &r) gsl_noexcept {
        const basic_string_span<typename std11::add_const<T>::type> l(u);

        return std98::lexicographical_compare(l.begin(), l.end(), r.begin(), r.end());
    }
#endif

#else  // gsl_CONFIG( ALLOWS_NONSTRICT_SPAN_COMPARISON )

    // Strict equality: both operands must be basic_string_span of the same
    // element type. Equal when lengths match and all elements compare equal.
    template <class T>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr14 bool operator==(
            basic_string_span<T> const &l, basic_string_span<T> const &r) gsl_noexcept {
        // Different lengths can never compare equal; skip the element walk.
        if (l.size() != r.size())
            return false;

        return std98::equal(l.begin(), l.end(), r.begin());
    }

    // Strict ordering: lexicographic comparison of two basic_string_span of the
    // same element type.
    template <class T>
    gsl_SUPPRESS_MSGSL_WARNING(stl .1) gsl_NODISCARD inline gsl_constexpr14 bool operator<(
            basic_string_span<T> const &l, basic_string_span<T> const &r) gsl_noexcept {
        const bool l_before_r =
                std98::lexicographical_compare(l.begin(), l.end(), r.begin(), r.end());

        return l_before_r;
    }

#endif  // gsl_CONFIG( ALLOWS_NONSTRICT_SPAN_COMPARISON )

    // Inequality, defined as the negation of operator== for the same operands.
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr14 bool operator!=(basic_string_span<T> const &l, U const &r)
            gsl_noexcept {
        const bool same = (l == r);

        return !same;
    }

    // l <= r, expressed as "r is not less than l".
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr14 bool operator<=(basic_string_span<T> const &l, U const &r)
            gsl_noexcept {
#if gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) || !gsl_CONFIG(ALLOWS_NONSTRICT_SPAN_COMPARISON)
        const bool r_before_l = (r < l);
#else
        // No operator< with a non-span left operand is available in this
        // configuration, so convert `r` to a span before comparing.
        basic_string_span<typename std11::add_const<T>::type> rr(r);
        const bool r_before_l = (rr < l);
#endif
        return !r_before_l;
    }

    // l > r, expressed as "r is less than l".
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr14 bool operator>(basic_string_span<T> const &l, U const &r)
            gsl_noexcept {
#if gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG) || !gsl_CONFIG(ALLOWS_NONSTRICT_SPAN_COMPARISON)
        const bool r_before_l = (r < l);
#else
        // No operator< with a non-span left operand is available in this
        // configuration, so convert `r` to a span before comparing.
        basic_string_span<typename std11::add_const<T>::type> rr(r);
        const bool r_before_l = (rr < l);
#endif
        return r_before_l;
    }

    // l >= r, expressed as "l is not less than r".
    template <class T, class U>
    gsl_NODISCARD inline gsl_constexpr14 bool operator>=(basic_string_span<T> const &l, U const &r)
            gsl_noexcept {
        const bool l_before_r = (l < r);

        return !l_before_r;
    }

#if gsl_HAVE(DEFAULT_FUNCTION_TEMPLATE_ARG)

    // Inequality with the span on the right-hand side; negation of operator==.
    template <class T, class U gsl_ENABLE_IF_((!detail::is_basic_string_span<U>::value))>
    gsl_NODISCARD inline gsl_constexpr14 bool operator!=(U const &l, basic_string_span<T> const &r)
            gsl_noexcept {
        const bool same = (l == r);

        return !same;
    }

    // l <= r with the span on the right-hand side: "r is not less than l".
    template <class T, class U gsl_ENABLE_IF_((!detail::is_basic_string_span<U>::value))>
    gsl_NODISCARD inline gsl_constexpr14 bool operator<=(U const &l, basic_string_span<T> const &r)
            gsl_noexcept {
        const bool r_before_l = (r < l);

        return !r_before_l;
    }

    // l > r with the span on the right-hand side: "r is less than l".
    template <class T, class U gsl_ENABLE_IF_((!detail::is_basic_string_span<U>::value))>
    gsl_NODISCARD inline gsl_constexpr14 bool operator>(U const &l, basic_string_span<T> const &r)
            gsl_noexcept {
        const bool r_before_l = (r < l);

        return r_before_l;
    }

    // l >= r with the span on the right-hand side: "l is not less than r".
    template <class T, class U gsl_ENABLE_IF_((!detail::is_basic_string_span<U>::value))>
    gsl_NODISCARD inline gsl_constexpr14 bool operator>=(U const &l, basic_string_span<T> const &r)
            gsl_noexcept {
        const bool l_before_r = (l < r);

        return !l_before_r;
    }

#endif  // gsl_HAVE( DEFAULT_FUNCTION_TEMPLATE_ARG )

    // convert basic_string_span to byte span:

    // Reinterprets the characters viewed by `spn` as a read-only span of bytes
    // covering spn.size_bytes() bytes starting at spn.data().
    template <class T>
    gsl_NODISCARD gsl_api inline span<const byte> as_bytes(basic_string_span<T> spn) gsl_noexcept {
        const byte *const first = reinterpret_cast<const byte *>(spn.data());  // NOLINT

        return span<const byte>(first, spn.size_bytes());
    }

    //
    // String types:
    //

    // Plain character pointers (mutable / read-only). By GSL naming convention
    // the "z" marks them as intended for zero-terminated strings; the typedefs
    // themselves enforce nothing.
    typedef char *zstring;
    typedef const char *czstring;

#if gsl_HAVE(WCHAR)
    // Wide-character counterparts, only declared when wchar_t is available.
    typedef wchar_t *wzstring;
    typedef const wchar_t *cwzstring;
#endif

    // basic_string_span over narrow characters (mutable / read-only elements).
    typedef basic_string_span<char> string_span;
    typedef basic_string_span<char const> cstring_span;

#if gsl_HAVE(WCHAR)
    // basic_string_span over wide characters (mutable / read-only elements).
    typedef basic_string_span<wchar_t> wstring_span;
    typedef basic_string_span<wchar_t const> cwstring_span;
#endif

    // to_string() allow (explicit) conversions from string_span to string

#if 0

// Generic form of to_string(), currently disabled by the surrounding `#if 0`;
// the concrete overloads in the `#else` branch are what actually gets compiled.
// Kept correct so it can be enabled without further changes: it returns a
// std::basic_string of the span's (non-const) character type holding a copy of
// the spn.length() characters starting at spn.data().
template< class T >
inline std::basic_string< typename std::remove_const<T>::type > to_string( basic_string_span<T> spn )
{
    return std::basic_string< typename std::remove_const<T>::type >(
        spn.data(), static_cast<std::size_t>( spn.length() ) );
}

#else

    // Copies the characters viewed by a mutable narrow span into a std::string.
    gsl_NODISCARD inline std::string to_string(string_span const &spn) {
        const std::size_t count = static_cast<std::size_t>(spn.length());

        return std::string(spn.data(), count);
    }

    // Copies the characters viewed by a read-only narrow span into a std::string.
    gsl_NODISCARD inline std::string to_string(cstring_span const &spn) {
        const std::size_t count = static_cast<std::size_t>(spn.length());

        return std::string(spn.data(), count);
    }

#if gsl_HAVE(WCHAR)

    // Copies the characters viewed by a mutable wide span into a std::wstring.
    gsl_NODISCARD inline std::wstring to_string(wstring_span const &spn) {
        const std::size_t count = static_cast<std::size_t>(spn.length());

        return std::wstring(spn.data(), count);
    }

    // Copies the characters viewed by a read-only wide span into a std::wstring.
    gsl_NODISCARD inline std::wstring to_string(cwstring_span const &spn) {
        const std::size_t count = static_cast<std::size_t>(spn.length());

        return std::wstring(spn.data(), count);
    }

#endif  // gsl_HAVE( WCHAR )
#endif  // to_string()

    //
    // Stream output for string_span types
    //

    namespace detail {

    // Writes `n` copies of the stream's current fill character directly into
    // the stream buffer. Writes nothing when `n` is zero or negative.
    template <class Stream>
    void write_padding(Stream &os, std::streamsize n) {
        std::streamsize remaining = n;

        while (remaining > 0) {
            os.rdbuf()->sputc(os.fill());
            --remaining;
        }
    }

    // Writes the characters of `spn` to `os`, padding with the fill character
    // up to the stream's field width. Padding goes in front when the adjust
    // field is `right`, otherwise behind. The field width is reset to 0
    // afterwards. Returns `os`; nothing is written if the stream is not in a
    // good state after constructing the sentry.
    template <class Stream, class Span>
    Stream &write_to_stream(Stream &os, Span const &spn) {
        typename Stream::sentry sentry(os);

        if (!os)
            return os;

        const std::streamsize length = gsl::narrow_failfast<std::streamsize>(spn.length());
        const std::streamsize field_width = os.width();

        // Padding is only needed when the field is wider than the text.
        const bool needs_padding = (length < field_width);
        const bool pad_in_front =
                needs_padding &&
                (os.flags() & std::ios_base::adjustfield) == std::ios_base::right;

        if (pad_in_front)
            detail::write_padding(os, field_width - length);

        // The span's characters themselves.
        os.rdbuf()->sputn(spn.begin(), length);

        if (needs_padding && !pad_in_front)
            detail::write_padding(os, field_width - length);

        // Field width applies to a single output operation only.
        os.width(0);

        return os;
    }

    }  // namespace detail

    // Stream insertion for a mutable narrow string span.
    template <typename Traits>
    std::basic_ostream<char, Traits> &operator<<(std::basic_ostream<char, Traits> &os,
                                                 string_span const &spn) {
        detail::write_to_stream(os, spn);

        return os;
    }

    // Stream insertion for a read-only narrow string span.
    template <typename Traits>
    std::basic_ostream<char, Traits> &operator<<(std::basic_ostream<char, Traits> &os,
                                                 cstring_span const &spn) {
        detail::write_to_stream(os, spn);

        return os;
    }

#if gsl_HAVE(WCHAR)

    // Stream insertion for a mutable wide string span.
    template <typename Traits>
    std::basic_ostream<wchar_t, Traits> &operator<<(std::basic_ostream<wchar_t, Traits> &os,
                                                    wstring_span const &spn) {
        detail::write_to_stream(os, spn);

        return os;
    }

    // Stream insertion for a read-only wide string span.
    template <typename Traits>
    std::basic_ostream<wchar_t, Traits> &operator<<(std::basic_ostream<wchar_t, Traits> &os,
                                                    cwstring_span const &spn) {
        detail::write_to_stream(os, spn);

        return os;
    }

#endif  // gsl_HAVE( WCHAR )

    //
    // ensure_sentinel()
    //
    // Provides a way to obtain a span from a contiguous sequence
    // that ends with a (non-inclusive) sentinel value.
    //
    // Will fail-fast if sentinel cannot be found before max elements are
    // examined.
    //
    namespace detail {

    // Scans forward from `seq` for the first element equal to `Sentinel` and
    // returns a span covering the elements before it (the sentinel itself is
    // excluded).
    //
    //   seq  - start of the sequence to scan.
    //   max  - upper bound on the number of elements stepped over; defaults to
    //          the largest value of SizeType.
    //
    // Fails via gsl_Expects when the element at which the scan stopped is not
    // the sentinel.
    template <class T, class SizeType, const T Sentinel>
    gsl_constexpr14 static span<T> ensure_sentinel(
            T *seq,
            SizeType max = (std::numeric_limits<SizeType>::max)()) {
        typedef T *pointer;

        gsl_SUPPRESS_MSVC_WARNING(26429,
                                  "f.23: symbol 'cur' is never tested for "
                                  "nullness, it can be marked as not_null") pointer cur = seq;

        // Advance until either `max` elements have been passed or the sentinel
        // is found.
        while (static_cast<SizeType>(cur - seq) < max && *cur != Sentinel)
            ++cur;

        // If the loop stopped because `max` was reached, this check reads the
        // element at index `max`.
        // NOTE(review): callers therefore appear to need seq[max] to be
        // readable (e.g. the terminator of a std::string of length max) -
        // confirm before passing an exact buffer size.
        gsl_Expects(*cur == Sentinel);

        return span<T>(seq, gsl::narrow_cast<typename span<T>::index_type>(cur - seq));
    }
    }  // namespace detail

    //
    // ensure_z - creates a string_span for a czstring or cwzstring.
    // Will fail fast if a null-terminator cannot be found before
    // the limit of size_type.
    //

    // Pointer overload: scans from `sz` for a zero element, stepping over at
    // most `max` elements, and returns the span in front of it.
    template <class T>
    gsl_NODISCARD inline gsl_constexpr14 span<T> ensure_z(
            T *const &sz, size_t max = (std::numeric_limits<size_t>::max)()) {
        T *const first = sz;

        return detail::ensure_sentinel<T, size_t, 0>(first, max);
    }

    // Array overload: forwards to the pointer overload with the address of the
    // first element and the array extent N as the limit.
    template <class T, size_t N>
    gsl_NODISCARD inline gsl_constexpr14 span<T> ensure_z(T(&sz)[N]) {
        T *const first = gsl_ADDRESSOF(sz[0]);

        return ::gsl::ensure_z(first, N);
    }

#if gsl_HAVE(TYPE_TRAITS)

    // Container overload: forwards to the pointer overload with cont.data() and
    // cont.length() as the limit.
    template <class Container>
    gsl_NODISCARD inline gsl_constexpr14
            span<typename std::remove_pointer<typename Container::pointer>::type>
            ensure_z(Container & cont) {
        const size_t limit = cont.length();

        return ::gsl::ensure_z(cont.data(), limit);
    }
#endif

    //
    // basic_zstring_span<> - A view of contiguous null-terminated characters,
    // replace (*,len).
    //

    // View over a contiguous character sequence whose last element is '\0'.
    // Wraps a span<T> that includes the terminator; the constructor checks the
    // terminator is present.
    template <typename T>
    class basic_zstring_span {
    public:
        typedef T element_type;
        typedef span<T> span_type;

        typedef typename span_type::index_type index_type;
        typedef typename span_type::difference_type difference_type;

        typedef element_type *czstring_type;
        typedef basic_string_span<element_type> string_span_type;

        // Wraps `s`; fails via gsl_Expects unless the last element of `s` is
        // '\0'.
        gsl_api gsl_constexpr14 basic_zstring_span(span_type s) : span_(s) {
            // expects a zero-terminated span
            gsl_Expects(s.back() == '\0');
        }

        // Copy/move: compiler-generated where `= default` is supported,
        // hand-written copy operations otherwise.
#if gsl_HAVE(IS_DEFAULT)
        gsl_constexpr basic_zstring_span(basic_zstring_span const &) = default;
        gsl_constexpr basic_zstring_span(basic_zstring_span &&) = default;
        gsl_constexpr14 basic_zstring_span &operator=(basic_zstring_span const &) = default;
        gsl_constexpr14 basic_zstring_span &operator=(basic_zstring_span &&) = default;
#else
        gsl_api gsl_constexpr basic_zstring_span(basic_zstring_span const &other)
                : span_(other.span_) {}
        gsl_api gsl_constexpr basic_zstring_span &operator=(basic_zstring_span const &other) {
            span_ = other.span_;
            return *this;
        }
#endif

        // Always false: this function unconditionally reports non-empty.
        gsl_NODISCARD gsl_api gsl_constexpr bool empty() const gsl_noexcept { return false; }

        // The viewed characters without the final element (the terminator).
        gsl_NODISCARD gsl_api gsl_constexpr string_span_type as_string_span() const gsl_noexcept {
            return string_span_type(span_.data(), span_.size() - 1);
        }

        // Re-scans the wrapped span for the first zero element via
        // ::gsl::ensure_z and returns the characters in front of it.
        /*gsl_api*/  // currently disabled due to an apparent NVCC bug
        gsl_NODISCARD gsl_constexpr string_span_type ensure_z() const {
            return ::gsl::ensure_z(span_.data(), span_.size());
        }

        // Pointer to the first character, returned without any further check.
        gsl_NODISCARD gsl_api gsl_constexpr czstring_type assume_z() const gsl_noexcept {
            return span_.data();
        }

    private:
        // Underlying span, including the terminating '\0'.
        span_type span_;
    };

    //
    // zString types:
    //

    // basic_zstring_span over narrow characters (mutable / read-only elements).
    typedef basic_zstring_span<char> zstring_span;
    typedef basic_zstring_span<char const> czstring_span;

#if gsl_HAVE(WCHAR)
    // basic_zstring_span over wide characters, only when wchar_t is available.
    typedef basic_zstring_span<wchar_t> wzstring_span;
    typedef basic_zstring_span<wchar_t const> cwzstring_span;
#endif

}  // namespace gsl

#if gsl_HAVE(HASH)

//
// std::hash specializations for GSL types
//

namespace gsl {

namespace detail {

//
// Helper struct for std::hash specializations
//

// Base class selected by a compile-time flag. The primary template (used for
// `true`) is an empty struct that adds no restrictions to the deriving type.
template <bool Condition>
struct conditionally_enabled_hash {};

// disabled as described in [unord.hash]
// Specialization for `false`: every special member function is declared with
// gsl_is_delete, so types deriving from it cannot be constructed, copied,
// moved or assigned.
// NOTE(review): gsl_is_delete_access / gsl_is_delete are defined outside this
// section - presumably an access specifier and `= delete`; confirm there.
template <>
struct conditionally_enabled_hash<false> {
    gsl_is_delete_access : conditionally_enabled_hash() gsl_is_delete;
    conditionally_enabled_hash(conditionally_enabled_hash const &) gsl_is_delete;
    conditionally_enabled_hash(conditionally_enabled_hash &&) gsl_is_delete;
    conditionally_enabled_hash &operator=(conditionally_enabled_hash const &) gsl_is_delete;
    conditionally_enabled_hash &operator=(conditionally_enabled_hash &&) gsl_is_delete;
};

}  // namespace detail

}  // namespace gsl

namespace std {

// Hash for not_null<T> with a general T: forwards to hash<T> applied to the
// wrapped value obtained through as_nullable(). The base class is
// conditionally_enabled_hash<false> when hash<T> is not default constructible.
template <class T>
struct hash<::gsl::not_null<T>> : public ::gsl::detail::conditionally_enabled_hash<
                                          is_default_constructible<hash<T>>::value> {
public:
    gsl_NODISCARD gsl_constexpr std::size_t operator()(::gsl::not_null<T> const &v) const
    // hash function is not `noexcept` because `as_nullable()` has preconditions
    {
        return hash<T>()(::gsl::as_nullable(v));
    }
};
// Hash for not_null<T *>: forwards to hash<T *> on the wrapped raw pointer.
// Unlike the general case this specialization is declared gsl_noexcept and has
// no conditional base class.
template <class T>
struct hash<::gsl::not_null<T *>> {
public:
    gsl_NODISCARD gsl_constexpr std::size_t operator()(::gsl::not_null<T *> const &v) const
            gsl_noexcept {
        return hash<T *>()(::gsl::as_nullable(v));
    }
};

// Hash for gsl::byte: the byte converted to std::size_t via to_integer.
template <>
struct hash<::gsl::byte> {
public:
    gsl_NODISCARD gsl_constexpr std::size_t operator()(::gsl::byte v) const gsl_noexcept {
        return ::gsl::to_integer<std::size_t>(v);
    }
};

}  // namespace std

#endif  // gsl_HAVE( HASH )

#if gsl_FEATURE(GSL_LITE_NAMESPACE)

// gsl_lite namespace:

// gsl-lite currently keeps all symbols in the namespace `gsl`. The `gsl_lite`
// namespace contains all the symbols in the `gsl` namespace, plus some
// extensions that are not specified in the Core Guidelines.
//
// Going forward, we want to support coexistence of gsl-lite with M-GSL, so we
// want to encourage using the `gsl_lite` namespace when consuming gsl-lite.
// Typical use in library code would be:
//
//     #include <gsl-lite/gsl-lite.hpp>  // instead of <gsl/gsl-lite.hpp>
//
//     namespace foo {
//         namespace gsl = ::gsl_lite;  // convenience alias
//         double mean( gsl::span<double const> elements )
//         {
//             gsl_Expects( ! elements.empty() );  // instead of Expects()
//             ...
//         }
//     } // namespace foo
//
// In a future version, the new <gsl-lite/gsl-lite.hpp> header will only define
// the `gsl_lite` namespace and no unprefixed `Expects()` and `Ensures()` macros
// to avoid collision with M-GSL. To ensure backward compatibility, the old
// header <gsl/gsl-lite.hpp> will keep defining the `gsl` namespace and the
// `Expects()` and `Ensures()` macros.

// Re-exports the public symbols of namespace `gsl` under the name `gsl_lite`,
// so consumers can refer to gsl-lite without claiming the `gsl` namespace.
// Every entry is a using-declaration, namespace alias or using-directive;
// nothing new is defined here except the MSVC fallback for `owner`.
namespace gsl_lite {

namespace std11 = ::gsl::std11;
namespace std14 = ::gsl::std14;
namespace std17 = ::gsl::std17;
namespace std20 = ::gsl::std20;

using namespace std11;
using namespace std14;
using namespace std17;
using namespace std20;

using namespace ::gsl::detail::no_adl;

#if gsl_HAVE(SHARED_PTR)
using std::make_shared;
using std::shared_ptr;
using std::unique_ptr;
#endif

using ::gsl::diff;
using ::gsl::dim;
using ::gsl::index;
using ::gsl::stride;

#if gsl_HAVE(ALIAS_TEMPLATE)
// VS 2015 and earlier have trouble with `using` for alias templates, so the
// alias template is re-declared instead of imported for those compilers.
#if gsl_BETWEEN(gsl_COMPILER_MSVC_VERSION, 1, 141)
template <class T
#if gsl_HAVE(TYPE_TRAITS)
          ,
          typename = typename std::enable_if<std::is_pointer<T>::value>::type
#endif
          >
using owner = T;
#else
using ::gsl::owner;
#endif
#endif

using ::gsl::fail_fast;

using ::gsl::finally;
#if gsl_FEATURE(EXPERIMENTAL_RETURN_GUARD)
using ::gsl::on_error;
using ::gsl::on_return;
#endif  // gsl_FEATURE( EXPERIMENTAL_RETURN_GUARD )

using ::gsl::narrow;
using ::gsl::narrow_cast;
using ::gsl::narrow_failfast;
using ::gsl::narrowing_error;

using ::gsl::at;

using ::gsl::make_not_null;
using ::gsl::not_null;
using ::gsl::not_null_ic;

using ::gsl::byte;

using ::gsl::to_byte;
using ::gsl::to_integer;
using ::gsl::to_string;
using ::gsl::to_uchar;

using ::gsl::with_container;
using ::gsl::with_container_t;

using ::gsl::as_bytes;
using ::gsl::as_writable_bytes;
using ::gsl::byte_span;
using ::gsl::copy;
using ::gsl::make_span;
using ::gsl::span;
#if !gsl_DEPRECATE_TO_LEVEL(6)
using ::gsl::as_writeable_bytes;
#endif

using ::gsl::basic_string_span;
using ::gsl::cstring_span;
using ::gsl::string_span;

using ::gsl::basic_zstring_span;
using ::gsl::czstring_span;
using ::gsl::zstring_span;

using ::gsl::czstring;
using ::gsl::zstring;

#if gsl_HAVE(WCHAR)
using ::gsl::cwzstring;
using ::gsl::wzstring;

// Wide-character string spans are declared in `gsl` under the same
// gsl_HAVE(WCHAR) guard as the other wide types; export them as well so the
// wide set matches the narrow one above.
using ::gsl::cwstring_span;
using ::gsl::wstring_span;

using ::gsl::cwzstring_span;
using ::gsl::wzstring_span;
#endif  // gsl_HAVE( WCHAR )

using ::gsl::ensure_z;

}  // namespace gsl_lite

#endif  // gsl_FEATURE( GSL_LITE_NAMESPACE )

gsl_RESTORE_MSVC_WARNINGS()

// #undef internal macros
#undef gsl_STATIC_ASSERT_
#undef gsl_ENABLE_IF_
#undef gsl_TRAILING_RETURN_TYPE_
#undef gsl_RETURN_DECLTYPE_

#endif  // GSL_GSL_LITE_HPP_INCLUDED

        // end of file


================================================
FILE: third_party/include/gsl.h
================================================
//
// gsl-lite is based on GSL: Guidelines Support Library.
// For more information see https://github.com/gsl-lite/gsl-lite
//
// Copyright (c) 2015 Martin Moene
// Copyright (c) 2015 Microsoft Corporation. All rights reserved.
//
// This code is licensed under the MIT License (MIT).
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.

// mimic MS include hierarchy

// Include guard: the body below is processed at most once per translation unit.
#ifndef GSL_GSL_H_INCLUDED
#define GSL_GSL_H_INCLUDED

// Emit a build-time notice pointing users at the replacement header.
#pragma message("gsl.h is deprecated since version 0.27.0, use gsl/gsl-lite.hpp instead.")

// Forward to the actual implementation header.
#include "gsl/gsl-lite.hpp"

#endif  // GSL_GSL_H_INCLUDED


================================================
FILE: third_party/jsoncons-0.166-icc-fix.patch
================================================
commit 28c56b90ec7337f98a5b8942574590111a5e5831
Author: Alex Merry <alex.merry@nanoporetech.com>
Date:   Wed Aug 4 15:40:53 2021 +0100

    Make implementation_type public in container types

    This is used by jsoncons::type_traits::detail::basic_json_t in certain
    circumstances, and ICC does not like that it is not publicly accessible.

    Fixes compilation errors like:

    jsoncons/basic_json.hpp(49):
    error #525: type "jsoncons::json_object<KeyT, Json,
    std::enable_if<std::is_same<Json::implementation_policy::key_order,
    jsoncons::sort_key_order>::value, void>::type>::implementation_policy
    [with KeyT=std::basic_string<char, std::char_traits<char>,
    std::allocator<char>>, Json=jsoncons::basic_json<char,
    jsoncons::sorted_policy, std::allocator<char>>]" (declared at line 541
    of "jsoncons/json_container_types.hpp")
    is an inaccessible type (allowed for cfront compatibility)
    basic_json_t = basic_json<typename T::char_type,typename
    T::implementation_policy,typename T::allocator_type>;
    detected during:
        instantiation of type
        "jsoncons::type_traits::detail::basic_json_t<
        jsoncons::json_object<std::basic_string<char,
        std::char_traits<char>, std::allocator<char>>,
        jsoncons::basic_json<char, jsoncons::sorted_policy,
        std::allocator<char>>, void>>" at line 182 of
        "jsoncons/more_type_traits.hpp"

diff --git a/include/jsoncons/json_container_types.hpp b/include/jsoncons/json_container_types.hpp
index afe10d4..ced66e6 100644
--- a/include/jsoncons/json_container_types.hpp
+++ b/include/jsoncons/json_container_types.hpp
@@ -32,8 +32,8 @@ namespace jsoncons {
     public:
         using allocator_type = typename Json::allocator_type;
         using value_type = Json;
-    private:
         using implementation_policy = typename Json::implementation_policy;
+    private:
         using value_allocator_type = typename std::allocator_traits<allocator_type>:: template rebind_alloc<value_type>;
         using value_container_type = typename implementation_policy::template sequence_container_type<value_type,value_allocator_type>;
         value_container_type elements_;
@@ -537,8 +537,8 @@ namespace jsoncons {
         using key_value_type = key_value<KeyT,Json>;
         using char_type = typename Json::char_type;
         using string_view_type = typename Json::string_view_type;
-    private:
         using implementation_policy = typename Json::implementation_policy;
+    private:
         using key_value_allocator_type = typename std::allocator_traits<allocator_type>:: template rebind_alloc<key_value_type>;
         using key_value_container_type = typename implementation_policy::template sequence_container_type<key_value_type,key_value_allocator_type>;

@@ -1235,8 +1235,8 @@ namespace jsoncons {
         //using mapped_type = Json;
         using string_view_type = typename Json::string_view_type;
         using key_value_type = key_value<KeyT,Json>;
-    private:
         using implementation_policy = typename Json::implementation_policy;
+    private:
         using key_value_allocator_type = typename std::allocator_traits<allocator_type>:: template rebind_alloc<key_value_type>;
         using key_value_container_type = typename implementation_policy::template sequence_container_type<key_value_type,key_value_allocator_type>;
         typedef typename std::allocator_traits<allocator_type>:: template rebind_alloc<std::size_t> index_allocator_type;


================================================
FILE: third_party/licenses/catch2.txt
================================================
Boost Software License - Version 1.0 - August 17th, 2003

Permission is hereby granted, free of charge, to any person or organization
obtaining a copy of the software and accompanying documentation covered by
this license (the "Software") to use, reproduce, display, distribute,
execute, and transmit the Software, and to prepare derivative works of the
Software, and to permit third-parties to whom the Software is furnished to
do so, all subject to the following:

The copyright notices in the Software and this entire statement, including
the above license grant, this restriction and the following disclaimer,
must be included in all copies of the Software, in whole or in part, and
all derivative works of the Software, unless such copies or derivative
works are solely in the form of machine-executable object code generated by
a source language processor.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT
SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE
FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE,
ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.


================================================
FILE: third_party/licenses/gsl-lite.txt
================================================
The MIT License (MIT)

Copyright (c) 2015 Martin Moene
Copyright (c) 2015 Microsoft Corporation. All rights reserved.

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.


================================================
FILE: third_party/software_versions.yaml
================================================
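# Structure:
# <name (use correct capitalisation, spaces, etc - quote if necessary)>:
#     description: <short explanation of what the software is and why it is included>
#     omit: <optional; true to leave this entry out of the third-party license files>
#     version: "<what version is included>"
#     url: <address of the upstream project>
#     license: "<path to a file in the licenses dir>"
#     files:
#         - shell-style globs of files in include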
#
# This information is both useful to developers and used to build third-party software information
# documents to include in our distributions (many open source licenses require this, and it's
# generally a good thing to do regardless).
#
# The license file should ideally be copied directly from the source distribution.
#
# The "files" field is used by the CI jobs to check that this file has been assembled correctly, and
# we didn't forget any licenses.
---
Catch2:
    description: >
        Unit testing framework. Nicer to use than most other C++ unit testing frameworks.
    # Omitted from third-party license files because it's not in any shipped code
    # (written as the canonical lowercase boolean so every YAML loader reads it as a bool)
    omit: true
    version: "2.13.7"
    url: https://github.com/catchorg/Catch2
    license: licenses/catch2.txt
    files:
        - include/catch2/catch.hpp
GSL Lite:
    description: >
        Functions and types suggested for use by the C++ Core Guidelines
        <https://github.com/isocpp/CppCoreGuidelines>. In the future we may want to switch to
        Microsoft's implementation <https://github.com/microsoft/gsl>, but that doesn't support
        GCC 4.8.
    version: "0.38.1"
    # Matches the project address given in the header comment of include/gsl.h
    url: https://github.com/gsl-lite/gsl-lite
    license: licenses/gsl-lite.txt
    files:
        - include/gsl.h
        - include/gsl
pybind11:
    description: >
        pybind11 is a lightweight header-only library that exposes C++ types in Python
        and vice versa, mainly to create Python bindings of existing C++ code.
    version: "2.10.1"
    url: https://github.com/pybind/pybind11
    license: licenses/pybind11.txt
    files:
        - include/pybind11/*